diff options
| field | value | date |
|---|---|---|
| author | Konstantin <const@const.me> | 2023-01-24 17:40:50 +0100 |
| committer | Konstantin <const@const.me> | 2023-01-24 17:40:50 +0100 |
| commit | e78815de53005336c3746bcd85c2e789a43f1b94 (patch) | |
| tree | 5fe25b6d4024bbcca7402ebcc28910417c54758d /ComputeShaders | |
| parent | 9d6fb00973218ebc397e15819be3964423b81f91 (diff) | |
Performance tuning on AMD iGPU
Diffstat (limited to 'ComputeShaders')
| mode | file | lines changed |
|---|---|---|
| -rw-r--r-- | ComputeShaders/ComputeShaders.vcxproj | 2 |
| -rw-r--r-- | ComputeShaders/ComputeShaders.vcxproj.filters | 2 |
| -rw-r--r-- | ComputeShaders/mulMatByRowTiled64.hlsl | 4 |
| -rw-r--r-- | ComputeShaders/mulMatByRowTiledEx.hlsl | 2 |
| -rw-r--r-- | ComputeShaders/mulMatTiled64.hlsl | 3 |
| -rw-r--r-- | ComputeShaders/mulMatTiledEx.hlsl | 2 |
6 files changed, 2 insertions, 13 deletions
diff --git a/ComputeShaders/ComputeShaders.vcxproj b/ComputeShaders/ComputeShaders.vcxproj index 300974a..b79f550 100644 --- a/ComputeShaders/ComputeShaders.vcxproj +++ b/ComputeShaders/ComputeShaders.vcxproj @@ -184,14 +184,12 @@ <FxCompile Include="mulMatByRow.hlsl" /> <FxCompile Include="mulMatByRow64.hlsl" /> <FxCompile Include="mulMatByRowTiled.hlsl" /> - <FxCompile Include="mulMatByRowTiled64.hlsl" /> <FxCompile Include="mulMatByRowTiledEx.hlsl" /> <FxCompile Include="mulMatByScalar.hlsl" /> <FxCompile Include="mulMatDotMain.hlsl" /> <FxCompile Include="mulMatDotReshape.hlsl" /> <FxCompile Include="mulMatMadMain.hlsl" /> <FxCompile Include="mulMatTiled.hlsl" /> - <FxCompile Include="mulMatTiled64.hlsl" /> <FxCompile Include="mulMatTiledEx.hlsl" /> <FxCompile Include="norm.hlsl" /> <FxCompile Include="normCompat.hlsl" /> diff --git a/ComputeShaders/ComputeShaders.vcxproj.filters b/ComputeShaders/ComputeShaders.vcxproj.filters index de9f12f..fbf30d6 100644 --- a/ComputeShaders/ComputeShaders.vcxproj.filters +++ b/ComputeShaders/ComputeShaders.vcxproj.filters @@ -43,9 +43,7 @@ <FxCompile Include="normFixed64.hlsl" /> <FxCompile Include="mulMatByRowTiled.hlsl" /> <FxCompile Include="convolutionMain2Fixed.hlsl" /> - <FxCompile Include="mulMatByRowTiled64.hlsl" /> <FxCompile Include="addRows.hlsl" /> - <FxCompile Include="mulMatTiled64.hlsl" /> <FxCompile Include="zeroMemory.hlsl" /> <FxCompile Include="mulMatTiledEx.hlsl" /> <FxCompile Include="matReshapePanels.hlsl" /> diff --git a/ComputeShaders/mulMatByRowTiled64.hlsl b/ComputeShaders/mulMatByRowTiled64.hlsl deleted file mode 100644 index 6c63f2d..0000000 --- a/ComputeShaders/mulMatByRowTiled64.hlsl +++ /dev/null @@ -1,4 +0,0 @@ -#define THREADS_Y 32 -#define THREADS_X 32 -#define TILE_Y 128 -#include "mulMatByRowTiled.hlsl"
\ No newline at end of file diff --git a/ComputeShaders/mulMatByRowTiledEx.hlsl b/ComputeShaders/mulMatByRowTiledEx.hlsl index bc0c0c6..d286ec2 100644 --- a/ComputeShaders/mulMatByRowTiledEx.hlsl +++ b/ComputeShaders/mulMatByRowTiledEx.hlsl @@ -3,7 +3,7 @@ static const uint TILE_SIZE = 32; #endif #ifndef THREADS_Y -static const uint THREADS_Y = 16; +static const uint THREADS_Y = 8; #endif // First tensor, reshaped into dense column major horizontal panels of size [ width, TILE_SIZE ] diff --git a/ComputeShaders/mulMatTiled64.hlsl b/ComputeShaders/mulMatTiled64.hlsl deleted file mode 100644 index 45d77b1..0000000 --- a/ComputeShaders/mulMatTiled64.hlsl +++ /dev/null @@ -1,3 +0,0 @@ -#define TILE_SIZE 64 -#define STREAM_SECOND_MATRIX 1 -#include "mulMatTiled.hlsl"
\ No newline at end of file diff --git a/ComputeShaders/mulMatTiledEx.hlsl b/ComputeShaders/mulMatTiledEx.hlsl index e6d6940..c59e3ea 100644 --- a/ComputeShaders/mulMatTiledEx.hlsl +++ b/ComputeShaders/mulMatTiledEx.hlsl @@ -6,7 +6,7 @@ static const uint TILE_SIZE = 32; #endif #ifndef TILE_HEIGHT -static const uint TILE_HEIGHT = 32; +static const uint TILE_HEIGHT = 64; #endif #ifndef THREADS_Y static const uint THREADS_Y = 8; |
