From 6cee1eeda28c1ce1e5d326a0c43427b4776a1d09 Mon Sep 17 00:00:00 2001 From: Yong He Date: Tue, 8 Jun 2021 07:44:05 -0700 Subject: Various fixes to CUDA backend. (#1877) - Fix emitting `StructuredBuffer::Load`, which triggers emitting for `IROp_WrapExistential` that is previously unhandled. - Fix cuda layout around vectors, they should be aligned to 1,2,4,8,16 bytes instead of just using element type's alignment. That means `float4` has alignment of 16 instead of 4. - Fix `SLANG_CUDA_HANDLE_ERROR` macro definition. - Fix navis sometimes fail to find `Slang::kIROp_*` enum values when debugging external projects. Co-authored-by: Yong He Co-authored-by: jsmall-nvidia --- source/slang/slang-emit-c-like.cpp | 11 +++++++++++ source/slang/slang-ir.cpp | 12 ++++++++++++ source/slang/slang-type-layout.cpp | 16 ++++++++++++++-- source/slang/slang.natvis | 22 +++++++++++----------- tools/gfx/cuda/render-cuda.cpp | 21 +++++++++++++-------- 5 files changed, 61 insertions(+), 21 deletions(-) diff --git a/source/slang/slang-emit-c-like.cpp b/source/slang/slang-emit-c-like.cpp index 1b0fe7c44..47c584251 100644 --- a/source/slang/slang-emit-c-like.cpp +++ b/source/slang/slang-emit-c-like.cpp @@ -1794,6 +1794,17 @@ void CLikeSourceEmitter::defaultEmitInstExpr(IRInst* inst, const EmitOpInfo& inO } break; + case kIROp_WrapExistential: + { + // Normally `WrapExistential` shouldn't exist in user code at this point. + // The only exception is when the user is calling a stdlib generic + // function that has an existential type argument, for example + // `StructuredBuffer.Load()`. + // We can safely ignore the `wrapExistential` operation in this case. + emitOperand(inst->getOperand(0), outerPrec); + } + break; + case kIROp_Select: { diff --git a/source/slang/slang-ir.cpp b/source/slang/slang-ir.cpp index 1f68623bb..90d0181f7 100644 --- a/source/slang/slang-ir.cpp +++ b/source/slang/slang-ir.cpp @@ -6019,3 +6019,15 @@ namespace Slang } } // namespace Slang +#if SLANG_VC +#ifdef _DEBUG +// Natvis sometimes cannot find enum values. +// Export symbols for them to make sure natvis works correctly when debugging external projects. +SLANG_API const int __SlangIROpNameHint = Slang::kIROp_NameHintDecoration; +SLANG_API const int __SlangIROpExport = Slang::kIROp_ExportDecoration; +SLANG_API const int __SlangIROpImport = Slang::kIROp_ImportDecoration; +SLANG_API const int __SlangIROpStringLit = Slang::kIROp_StringLit; +SLANG_API const int __SlangIROpIntLit = Slang::kIROp_IntLit; +#endif +#endif + diff --git a/source/slang/slang-type-layout.cpp b/source/slang/slang-type-layout.cpp index 2568547a4..02b5b5bdc 100644 --- a/source/slang/slang-type-layout.cpp +++ b/source/slang/slang-type-layout.cpp @@ -465,6 +465,18 @@ struct CUDALayoutRulesImpl : DefaultLayoutRulesImpl return arrayInfo; } + // Given `size` between [0, 16] return the smallest power-of-2 that is greater than or equal to `size`. + uint32_t getVectorAlignment(uint32_t size) + { + SLANG_ASSERT(size <= 16); + --size; + // Set every bit after the highest bit. + size |= (size >> 1); + size |= (size >> 2); + ++size; + return size; + } + SimpleLayoutInfo GetVectorLayout(BaseType elementType, SimpleLayoutInfo elementInfo, size_t elementCount) override { // Special case bool @@ -479,8 +491,8 @@ struct CUDALayoutRulesImpl : DefaultLayoutRulesImpl SimpleLayoutInfo vectorInfo; vectorInfo.kind = elementInfo.kind; vectorInfo.size = elementInfo.size * elementCount; - vectorInfo.alignment = elementInfo.alignment; - + vectorInfo.alignment = getVectorAlignment( + (uint32_t)(elementInfo.size.getFiniteValue() * elementCount)); return vectorInfo; } diff --git a/source/slang/slang.natvis b/source/slang/slang.natvis index ea010c187..5af533715 100644 --- a/source/slang/slang.natvis +++ b/source/slang/slang.natvis @@ -83,20 +83,20 @@ - + ((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.chars,[((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.numChars]s8 - + ((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.chars,[((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.numChars]s8 - + ((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.chars,[((Slang::IRStringLit*)(((Slang::IRUse*)(child + 1))->usedValue))->value.stringVal.numChars]s8 child = child->next - ((IRStringLit*)this)->value.stringVal.chars,[((IRStringLit*)this)->value.stringVal.numChars]s8 - ((IRIntLit*)this)->value.intVal + ((IRStringLit*)this)->value.stringVal.chars,[((IRStringLit*)this)->value.stringVal.numChars]s8 + ((IRIntLit*)this)->value.intVal