From ff2d490dc120708a2fcb6eea5880a6b7c6586a4b Mon Sep 17 00:00:00 2001 From: Dietrich Geisler Date: Mon, 17 Aug 2020 12:50:44 -0400 Subject: GPU Foreach Loop (#1498) * GPU Foreach Loop This PR introduces the completed GPU foreach loop and updates the heterogeneous-hello-world example to use it. This PR builds on the previous introduction of the GPU Foreach loop parsing and semantic checking PR (#1482) by introducing IR lowering and emmitting. THe new feature can be used by having a GPU_Foreach loop interacting with a named non-CPP entry point, and using the -heterogeneous flag. * Fix to path Co-authored-by: Tim Foley --- source/slang/slang-lower-to-ir.cpp | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) (limited to 'source/slang/slang-lower-to-ir.cpp') diff --git a/source/slang/slang-lower-to-ir.cpp b/source/slang/slang-lower-to-ir.cpp index 9c4808f31..864491f7e 100644 --- a/source/slang/slang-lower-to-ir.cpp +++ b/source/slang/slang-lower-to-ir.cpp @@ -4116,7 +4116,39 @@ struct StmtLoweringVisitor : StmtVisitor void visitGpuForeachStmt(GpuForeachStmt* stmt) { + auto builder = getBuilder(); startBlockIfNeeded(stmt); + + auto renderer = getSimpleVal(context, lowerRValueExpr(context, stmt->renderer)); + auto gridDims = getSimpleVal(context, lowerRValueExpr(context, stmt->gridDims)); + + List irArgs; + if (auto callExpr = as(stmt->kernelCall)) + { + irArgs.add(renderer); + irArgs.add(gridDims); + auto fref = getSimpleVal(context, lowerRValueExpr(context, callExpr->functionExpr)); + irArgs.add(fref); + for (auto arg : callExpr->arguments) + { + // if a reference to dispatchThreadID, don't emit + if (auto declRefExpr = as(arg)) + { + if (declRefExpr->declRef.getDecl() == stmt->dispatchThreadID) + { + continue; + } + } + auto irArg = getSimpleVal(context, lowerRValueExpr(context, arg)); + irArgs.add(irArg); + } + } + else + { + SLANG_UNEXPECTED("GPUForeach parsing produced an invalid result"); + } + + builder->emitGpuForeach(irArgs); return; } -- cgit v1.2.3