summaryrefslogtreecommitdiffstats
path: root/source/slang/emit.cpp
diff options
context:
space:
mode:
authorTim Foley <tfoley@nvidia.com>2017-12-21 16:16:23 -0800
committerTim Foley <tfoley@nvidia.com>2017-12-21 16:16:23 -0800
commit00490154ef0762839556b5884ba9b7523b265a1c (patch)
tree239e42c6e9fd2907afe52974cccda41555bde2ba /source/slang/emit.cpp
parent6f681279d99e72e717bb2b91763b80e570ae725b (diff)
Support generic `struct` types during IR-based emit
Fixes #318 Most of the required support was actually in place, so this is just a bunch of fixes: - Detect when we are in "full IR" mode, so that we can always emit `struct` declarations with their mangled named (which will produce different names for different specializations, since we emit decl-refs) - Carefully exclude builtin types from this for now. We'll need a more complete solution for mapping HLSL/Slang builtin types to their GLSL equivalents soon. - Skip emitting types referenced by generic IR functions, since they might not be usable. - Also fix things up so that we emit types used in the initializer for any global variables. - Fix bug in generic specialization where we specialize the same function more than once, with different type arguments. We were crashing on a `Dictionary::Add` call where the key already exists from a previous specialization attempt. - Fix name-mangling logic so that when outputting a possibly-specialized generic it looks for the outer-most `GenericSubstitution` rather than just the first one in the list. This is to handle the way that we insert other substitutions willy-nilly in places where they realistically don't belong. :( All of these changes together allow us to pass a slightly modified (more advanced) version of the test case posted to #318.
Diffstat (limited to 'source/slang/emit.cpp')
-rw-r--r--source/slang/emit.cpp104
1 files changed, 81 insertions, 23 deletions
diff --git a/source/slang/emit.cpp b/source/slang/emit.cpp
index 5cd0ea832..e9a2588d5 100644
--- a/source/slang/emit.cpp
+++ b/source/slang/emit.cpp
@@ -116,6 +116,10 @@ struct SharedEmitContext
// Map used to tell AST lowering what decls are represented by IR.
HashSet<Decl*>* irDeclSetForAST = nullptr;
+
+ // Are we doing IR-only emit, so that everything should get
+ // its mangled name?
+ bool isFullIRMode = false;
};
struct EmitContext
@@ -2996,10 +3000,21 @@ struct EmitVisitor
}
}
+ bool isBuiltinDecl(Decl* decl)
+ {
+ for (auto dd = decl; dd; dd = dd->ParentDecl)
+ {
+ if (dd->FindModifier<FromStdLibModifier>())
+ return true;
+ }
+ return false;
+ }
+
void EmitDeclRef(DeclRef<Decl> declRef)
{
// Are we emitting an AST in a context where some declarations
// are actually stored as IR code?
+
if(auto irDeclSet = context->shared->irDeclSetForAST)
{
Decl* decl = declRef.getDecl();
@@ -3010,6 +3025,17 @@ struct EmitVisitor
}
}
+ if (context->shared->isFullIRMode)
+ {
+ // Don't apply this to builting declarations
+ if (!isBuiltinDecl(declRef.getDecl()))
+ {
+ emit(getIRName(declRef));
+ return;
+ }
+ }
+
+
// TODO: need to qualify a declaration name based on parent scopes/declarations
@@ -4453,26 +4479,34 @@ emitDeclImpl(decl, nullptr);
String getIRName(DeclRefBase const& declRef)
{
- // It is a bit ugly, but we need a deterministic way
- // to get a name for things when emitting from the IR
- // that won't conflict with any keywords, builtins, etc.
- // in the target language.
+ // In general, when referring to a declaration that has been lowered
+ // via the IR, we want to use its mangled name.
+ //
+ // There are two main exceptions to this:
+ //
+ // 1. For debugging, we accept the `-no-mangle` flag which basically
+ // instructs us to try to use the original name of all declarations,
+ // to make the output more like what is expected to come out of
+ // fxc pass-through. This case should get deprecated some day.
//
- // Eventually we should accomplish this by using
- // mangled names everywhere, but that complicates things
- // when we are also using direct comparison to fxc/glslang
- // output for some of our tests.
+ // 2. It is really annoying to have the fields of a `struct` type
+ // get ridiculously lengthy mangled names, and this also messes
+ // up stuff like specialization (since the mangled name of a field
+ // would then include the mangled name of the outer type).
//
String name;
if (context->shared->entryPoint->compileRequest->compileFlags & SLANG_COMPILE_FLAG_NO_MANGLING)
{
+ // Special case (1):
name.append(getText(declRef.GetName()));
+ return name;
}
- else
- {
- name.append(getMangledName(declRef));
- }
+
+ // Special case (2): not implemented yet.
+
+ // General case:
+ name.append(getMangledName(declRef));
return name;
}
@@ -7040,6 +7074,24 @@ emitDeclImpl(decl, nullptr);
{}
}
+ void emitIRUsedTypesForGlobalValueWithCode(
+ EmitContext* ctx,
+ IRGlobalValueWithCode* value)
+ {
+ for( auto bb = value->getFirstBlock(); bb; bb = bb->getNextBlock() )
+ {
+ for( auto pp = bb->getFirstParam(); pp; pp = pp->getNextParam() )
+ {
+ emitIRUsedTypesForValue(ctx, pp);
+ }
+
+ for( auto ii = bb->getFirstInst(); ii; ii = ii->getNextInst() )
+ {
+ emitIRUsedTypesForValue(ctx, ii);
+ }
+ }
+ }
+
void emitIRUsedTypesForValue(
EmitContext* ctx,
IRValue* value)
@@ -7050,19 +7102,23 @@ emitDeclImpl(decl, nullptr);
case kIROp_Func:
{
auto irFunc = (IRFunc*) value;
+
+ // Don't emit anything for a generic function,
+ // since we only care about the types used by
+ // the actual specializations.
+ if (irFunc->genericDecl)
+ return;
+
emitIRUsedType(ctx, irFunc->getResultType());
- for( auto bb = irFunc->getFirstBlock(); bb; bb = bb->getNextBlock() )
- {
- for( auto pp = bb->getFirstParam(); pp; pp = pp->getNextParam() )
- {
- emitIRUsedTypesForValue(ctx, pp);
- }
- for( auto ii = bb->getFirstInst(); ii; ii = ii->getNextInst() )
- {
- emitIRUsedTypesForValue(ctx, ii);
- }
- }
+ emitIRUsedTypesForGlobalValueWithCode(ctx, irFunc);
+ }
+ break;
+
+ case kIROp_global_var:
+ {
+ auto irGlobal = (IRGlobalVar*) value;
+ emitIRUsedTypesForGlobalValueWithCode(ctx, irGlobal);
}
break;
@@ -7372,6 +7428,8 @@ String emitEntryPoint(
// compilation work. We thus start by cloning any code needed
// by the entry point over to our fresh IR module.
+ sharedContext.isFullIRMode = true;
+
specializeIRForEntryPoint(
irSpecializationState,
entryPoint);