diff options
| author | Sai Praveen Bangaru <31557731+saipraveenb25@users.noreply.github.com> | 2023-09-18 23:45:44 -0400 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2023-09-18 20:45:44 -0700 |
| commit | 95fcf65c38d52ed458a3b11622ea8b55a3864c24 (patch) | |
| tree | 5f07d03893504367466a278d7a1bcf63d4372c57 | |
| parent | e884b153f8c29438b818d9930b8342e5ac8f829f (diff) | |
Fix loop inversion issue that caused ordinary blocks with multiple predecessors (#3211)
* Add test case for while loop
* Fix loop inversion issue that caused ordinary blocks with multiple predecessors
The original version can leave the CFG in an invalid state with `e4` not being a break block or merge point, but having multiple predecessors.
The updated version creates a separate jump block for each break instruction to avoid this issue.
* Fixup tests
| -rw-r--r-- | source/slang/slang-ir-loop-inversion.cpp | 42 | ||||
| -rw-r--r-- | tests/autodiff/reverse-while-loop-3.slang | 66 | ||||
| -rw-r--r-- | tests/autodiff/reverse-while-loop-3.slang.expected.txt | 6 |
3 files changed, 90 insertions, 24 deletions
diff --git a/source/slang/slang-ir-loop-inversion.cpp b/source/slang/slang-ir-loop-inversion.cpp index 9d2f13877..e2f9b435c 100644 --- a/source/slang/slang-ir-loop-inversion.cpp +++ b/source/slang/slang-ir-loop-inversion.cpp @@ -118,19 +118,22 @@ static IRParam* duplicateToParamWithDecorations(IRBuilder& builder, IRCloneEnv& // s: ...1 goto c2 // c2: if x then goto e2 else goto l (merge at b) // e2: goto b -// l: loop break=b next=d +// l: loop break=b2 next=d // d: goto c1: // c1: if x then goto e1 else goto e3 (merge at e3) // e3: goto d -// e1: goto b +// e1: goto b2 +// b2: goto b // b: ...2 // // s is the Start block // c1, c2 are the Condition blocks // e1, e2, e3 are the critical Edge breakers -// l is the Loop entering block -// d is the loop boDy -// b is the Break block +// l is the loop entering block +// d is the loop body +// b is the merge point for the outer condition +// b2 is the new break block for the loop +// static void invertLoop(IRBuilder& builder, IRLoop* loop) { IRBuilderInsertLocScope builderScope(&builder); @@ -195,25 +198,23 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) c1bUse.set(e1); c1Terminator->afterBlock.set(d); - // We create another block e4 to handle other breaks from inside the loop, and - // rewrite existing breaks to jump to it. - // We keep e4 and e1 distinct since after the inversion step, insts in e4 will - // be re-written to use values from the loop entry, while e1 will use values from - // c1. + // We'll rewrite existing breaks to jump to b2, but via an intermediate jump block to + // avoid a critical edge. // - auto e4 = builder.emitBlock(); - e4->insertBefore(c1); - builder.emitBranch(b2, c1Params.getCount(), c1Params.getBuffer()); traverseUses(b, [&](IRUse* u){ auto userBlock = u->getUser()->getParent(); // Restrict this to just those blocks within this loop - if(userBlock != e4 && userBlock != e1 && userBlock != b2 && domTree->dominates(s, userBlock) && !domTree->dominates(b, userBlock)) - u->set(e4); + if(userBlock != e1 && userBlock != b2 && domTree->dominates(s, userBlock) && !domTree->dominates(b, userBlock)) + { + auto jumpToB2Block = builder.emitBlock(); + jumpToB2Block->insertAfter(userBlock); + builder.emitBranch(b2, c1Params.getCount(), c1Params.getBuffer()); + u->set(jumpToB2Block); + } }); // We now have // s: ...1 loop break=b next=c1 - // e4: goto b2 // c1: if x then goto e1 else goto d (merge at d) // e1: goto b2 // d: goto c1 @@ -238,7 +239,6 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) // We now have // s: ...1 loop break=b next=c1 - // e4: goto b2 // c2: if x then goto e2 else goto d (merge at b) // e2: goto b // c1: if x then goto e1 else goto d (merge at d) @@ -251,13 +251,11 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) const auto l = builder.emitBlock(); l->insertAfter(e2); loop->insertAtEnd(l); - e4->insertBefore(c1); // We now have // s: ...1 no-termiator // c2: if x then goto e2 else goto d (merge at b) // e2: goto b // l: loop break=b next=c1 - // e4: goto b2 // c1: if x then goto e1 else goto d (merge at d) // e1: goto b2 // d: goto c1 @@ -276,7 +274,6 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) // c2: if x then goto e2 else goto d (merge at b) // e2: goto b // l: loop break=b next=c1 - // e4: goto b2 // c1: if x then goto e1 else goto d (merge at d) // e1: goto b2 // d: goto c1 @@ -291,7 +288,6 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) // c2: if x then goto e2 else goto l (merge at b) // e2: goto b // l: loop break=b next=c1 - // e4: goto b2 // c1: if x then goto e1 else goto d (merge at d) // e1: goto b2 // d: goto c1 @@ -336,7 +332,6 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) const auto e3 = builder.emitBlock(); e3->insertAfter(c1); b2->insertBefore(b); - e4->insertAfter(c1); builder.emitBranch(d, ps.getCount(), ps.getBuffer()); c1dUse.set(e3); c1Terminator->afterBlock.set(e3); @@ -346,12 +341,11 @@ static void invertLoop(IRBuilder& builder, IRLoop* loop) // e2: goto b // l: loop break=b2 next=d // d: goto c1 - // e4: goto b2 // c1: if x then goto e1 else goto e3 (merge at e3) // e3: goto d // e1: goto b2 // b2: goto b - // b: ...2 + // b: ...2 } bool invertLoops(IRModule* module) diff --git a/tests/autodiff/reverse-while-loop-3.slang b/tests/autodiff/reverse-while-loop-3.slang new file mode 100644 index 000000000..67f030030 --- /dev/null +++ b/tests/autodiff/reverse-while-loop-3.slang @@ -0,0 +1,66 @@ +//TEST(compute):COMPARE_COMPUTE_EX:-slang -compute -shaderobj -output-using-type +//TEST(compute, vulkan):COMPARE_COMPUTE_EX:-vk -compute -shaderobj -output-using-type +//TEST(compute):COMPARE_COMPUTE_EX:-cpu -compute -output-using-type -shaderobj + +//TEST_INPUT:ubuffer(data=[0 0 0 0 0], stride=4):out,name=outputBuffer +RWStructuredBuffer<float> outputBuffer; + +// This test isn't actually testing the output, but rather that the compiler doesn't crash upon +// encountering a specific loop pattern. ('Data' is non-differentiable here, so the expected output is 0)s +// + +typedef DifferentialPair<float> dpfloat; +typedef float.Differential dfloat; + +struct P +{ + bool terminated; + bool isTerminated() { return terminated; } + bool isHit() { return !terminated; } +}; + +struct Data +{ + float t; +}; + +void updateData(Data data) +{ + data.t = data.t * data.t; +} + +[BackwardDifferentiable] +float test_simple_while(float y, uint n) +{ + Data d = { y }; + P p; + p.terminated = false; + int i = n; + + if (p.isTerminated()) + return d.t; + + [MaxIters(4)] + while (!p.isTerminated()) + { + updateData(d); + p.terminated = (i-- == 0); + if (p.isTerminated()) + break; + + if (!p.isHit()) + break; + } + return d.t; +} + +[numthreads(1, 1, 1)] +void computeMain(uint3 dispatchThreadID : SV_DispatchThreadID) +{ + { + dpfloat dpa = dpfloat(1.0, 0.0); + + __bwd_diff(test_simple_while)(dpa, 2, 1.0f); + outputBuffer[0] = dpa.d; // Expect: 8.0 + } +} diff --git a/tests/autodiff/reverse-while-loop-3.slang.expected.txt b/tests/autodiff/reverse-while-loop-3.slang.expected.txt new file mode 100644 index 000000000..ca54c9afe --- /dev/null +++ b/tests/autodiff/reverse-while-loop-3.slang.expected.txt @@ -0,0 +1,6 @@ +type: float +1.000000 +0.000000 +0.000000 +0.000000 +0.000000 |
