From 7561ffb3e7d4d55f1a4cf786319e7a07f204a9e3 Mon Sep 17 00:00:00 2001 From: Sai Praveen Bangaru <31557731+saipraveenb25@users.noreply.github.com> Date: Wed, 7 Jun 2023 00:16:19 -0400 Subject: AD: Fix out-of-scope indexing rules for insts in loop header blocks during the primal-inst availability pass (#2918) * add test case * Fix out-of-scope indexing rules for loop header blocks --------- Co-authored-by: Yong He Co-authored-by: Yong He --- source/slang/slang-ir-autodiff-primal-hoist.cpp | 28 ++++++++++++++++++------- source/slang/slang-ir-autodiff-primal-hoist.h | 6 ++++++ 2 files changed, 27 insertions(+), 7 deletions(-) (limited to 'source') diff --git a/source/slang/slang-ir-autodiff-primal-hoist.cpp b/source/slang/slang-ir-autodiff-primal-hoist.cpp index 0016f25e3..6947fd7c5 100644 --- a/source/slang/slang-ir-autodiff-primal-hoist.cpp +++ b/source/slang/slang-ir-autodiff-primal-hoist.cpp @@ -961,6 +961,7 @@ IRInst* emitIndexedStoreAddressForVar( IRInst* emitIndexedLoadAddressForVar( IRBuilder* builder, IRVar* localVar, + IRBlock* defBlock, const List& defBlockIndices, const List& useBlockIndices) { @@ -986,12 +987,15 @@ IRInst* emitIndexedLoadAddressForVar( { // If the use-block is outside this region, use the // last available value (by indexing with primal counter minus 1) + // An exception is if the stored inst is in a loop header block where + // we use counter directly (since that block runs N+1 times) // auto primalCounterCurrValue = index.primalCountParam; - auto primalCounterLastValue = builder->emitSub( - primalCounterCurrValue->getDataType(), - primalCounterCurrValue, - builder->getIntValue(builder->getIntType(), 1)); + auto primalCounterLastValue = (index.loopHeaderBlock == defBlock) ? primalCounterCurrValue : + builder->emitSub( + primalCounterCurrValue->getDataType(), + primalCounterCurrValue, + builder->getIntValue(builder->getIntType(), 1)); loadAddr = builder->emitElementAddress( builder->getPtrType(currType), @@ -1021,10 +1025,11 @@ IRVar* storeIndexedValue( IRInst* loadIndexedValue( IRBuilder* builder, IRVar* localVar, + IRBlock* defBlock, const List& defBlockIndices, const List& useBlockIndices) { - IRInst* addr = emitIndexedLoadAddressForVar(builder, localVar, defBlockIndices, useBlockIndices); + IRInst* addr = emitIndexedLoadAddressForVar(builder, localVar, defBlock, defBlockIndices, useBlockIndices); return builder->emitLoad(addr); } @@ -1292,7 +1297,12 @@ RefPtr ensurePrimalAvailability( List& useBlockIndices = indexedBlockInfo[getBlock(use->getUser())]; - IRInst* loadAddr = emitIndexedLoadAddressForVar(&builder, localVar, defBlockIndices, useBlockIndices); + IRInst* loadAddr = emitIndexedLoadAddressForVar( + &builder, + localVar, + defBlock, + defBlockIndices, + useBlockIndices); builder.replaceOperand(use, loadAddr); } @@ -1323,7 +1333,9 @@ RefPtr ensurePrimalAvailability( { List useBlockIndices = indexedBlockInfo[getBlock(use->getUser())]; setInsertBeforeOrdinaryInst(&builder, getInstInBlock(use->getUser())); - builder.replaceOperand(use, loadIndexedValue(&builder, localVar, defBlockIndices, useBlockIndices)); + builder.replaceOperand( + use, + loadIndexedValue(&builder, localVar, defBlock, defBlockIndices, useBlockIndices)); } if (!isRecomputeInst) @@ -1512,6 +1524,8 @@ void buildIndexedBlocks( IndexTrackingInfo indexInfo = {}; lowerIndexedRegion(primalLoop, loop, indexInfo.primalCountParam, indexInfo.diffCountParam); + indexInfo.loopHeaderBlock = getLoopConditionBlock(primalLoop); + SLANG_RELEASE_ASSERT(indexInfo.primalCountParam); SLANG_RELEASE_ASSERT(indexInfo.diffCountParam); diff --git a/source/slang/slang-ir-autodiff-primal-hoist.h b/source/slang/slang-ir-autodiff-primal-hoist.h index c9377d56b..59c70e862 100644 --- a/source/slang/slang-ir-autodiff-primal-hoist.h +++ b/source/slang/slang-ir-autodiff-primal-hoist.h @@ -211,6 +211,12 @@ namespace Slang IRInst* primalCountParam = nullptr; IRInst* diffCountParam = nullptr; + // Reference to the header block. Note that the header block + // typically contains the loop condition and is executed N+1 + // times if the loop body is executed N times. + // + IRBlock* loopHeaderBlock = nullptr; + enum CountStatus { Unresolved, -- cgit v1.2.3