From c1743a52c814377198ec8ee6a22f4487278c57be Mon Sep 17 00:00:00 2001
From: jsmall-nvidia
Date: Thu, 12 Mar 2020 15:47:44 -0400
Subject: Vector & Matrix Prefix Sum & Product (#1272)

* Implement matrix and vector versions of prefixSum and prefix product.

* Comment around how code is organized - where it seems it could be more performant.
---
 source/slang/hlsl.meta.slang | 4 ++++
 1 file changed, 4 insertions(+)

(limited to 'source')

diff --git a/source/slang/hlsl.meta.slang b/source/slang/hlsl.meta.slang
index 03496ccc8..2b556c10b 100644
--- a/source/slang/hlsl.meta.slang
+++ b/source/slang/hlsl.meta.slang
@@ -2677,8 +2677,10 @@ __generic
 __glsl_extension(GL_KHR_shader_subgroup_arithmetic)
 __spirv_version(1.3)
 __target_intrinsic(glsl, "subgroupExclusiveMul($0)")
+__target_intrinsic(cuda, "_wavePrefixProductMultiple($0)")
 vector WavePrefixProduct(vector expr);
 __generic
+__target_intrinsic(cuda, "_wavePrefixProductMultiple($0)")
 matrix WavePrefixProduct(matrix expr);
 
 __generic
@@ -2691,8 +2693,10 @@ __generic
 __glsl_extension(GL_KHR_shader_subgroup_arithmetic)
 __spirv_version(1.3)
 __target_intrinsic(glsl, "subgroupExclusiveAdd($0)")
+__target_intrinsic(cuda, "_wavePrefixSumMultiple($0)")
 vector WavePrefixSum(vector expr);
 __generic
+__target_intrinsic(cuda, "_wavePrefixSumMultiple($0)")
 matrix WavePrefixSum(matrix expr);
 
 __generic
-- 
cgit v1.2.3