From 0d21b7cbdeb2f2eb5ef123a15099da0b651b24c0 Mon Sep 17 00:00:00 2001 From: Alexey Bataev Date: Mon, 17 Jul 2023 09:47:01 -0700 Subject: [PATCH] [SLP][NFC]Improve compile-time by using map {TreeEntry *, Instruction *} in getLastInstructionInBundle(), NFC. Instead of building EntryToLastInstruction before the vectorization, build it automatically during the calls to getLastInstructionInBundle() function. --- llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp | 43 +++++++++---------------- 1 file changed, 15 insertions(+), 28 deletions(-) diff --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp index a5a9f00..5249071 100644 --- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp +++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp @@ -8992,6 +8992,9 @@ void BoUpSLP::reorderInputsAccordingToOpcode( } Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { + auto &Res = EntryToLastInstruction.FindAndConstruct(E); + if (Res.second) + return *Res.second; // Get the basic block this bundle is in. All instructions in the bundle // should be in this block (except for extractelement-like instructions with // constant indeces). @@ -9006,7 +9009,7 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { isVectorLikeInstWithConstOps(I); })); - auto &&FindLastInst = [E, Front, this, &BB]() { + auto FindLastInst = [&]() { Instruction *LastInst = Front; for (Value *V : E->Scalars) { auto *I = dyn_cast(V); @@ -9042,7 +9045,7 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { return LastInst; }; - auto &&FindFirstInst = [E, Front, this]() { + auto FindFirstInst = [&]() { Instruction *FirstInst = Front; for (Value *V : E->Scalars) { auto *I = dyn_cast(V); @@ -9082,7 +9085,6 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { if (doesNotNeedToSchedule(E->Scalars) || (E->State != TreeEntry::NeedToGather && all_of(E->Scalars, isVectorLikeInstWithConstOps))) { - Instruction *InsertInst; if ((E->getOpcode() == Instruction::GetElementPtr && any_of(E->Scalars, [](Value *V) { @@ -9091,15 +9093,12 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { all_of(E->Scalars, [](Value *V) { return !isVectorLikeInstWithConstOps(V) && isUsedOutsideBlock(V); })) - InsertInst = FindLastInst(); + Res.second = FindLastInst(); else - InsertInst = FindFirstInst(); - return *InsertInst; + Res.second = FindFirstInst(); + return *Res.second; } - // The last instruction in the bundle in program order. - Instruction *LastInst = nullptr; - // Find the last instruction. The common case should be that BB has been // scheduled, and the last instruction is VL.back(). So we start with // VL.back() and iterate over schedule data until we reach the end of the @@ -9112,7 +9111,7 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { if (Bundle && Bundle->isPartOfBundle()) for (; Bundle; Bundle = Bundle->NextInBundle) if (Bundle->OpValue == Bundle->Inst) - LastInst = Bundle->Inst; + Res.second = Bundle->Inst; } // LastInst can still be null at this point if there's either not an entry @@ -9133,15 +9132,15 @@ Instruction &BoUpSLP::getLastInstructionInBundle(const TreeEntry *E) { // not ideal. However, this should be exceedingly rare since it requires that // we both exit early from buildTree_rec and that the bundle be out-of-order // (causing us to iterate all the way to the end of the block). - if (!LastInst) - LastInst = FindLastInst(); - assert(LastInst && "Failed to find last instruction in bundle"); - return *LastInst; + if (!Res.second) + Res.second = FindLastInst(); + assert(Res.second && "Failed to find last instruction in bundle"); + return *Res.second; } void BoUpSLP::setInsertPointAfterBundle(const TreeEntry *E) { auto *Front = E->getMainOp(); - Instruction *LastInst = EntryToLastInstruction.lookup(E); + Instruction *LastInst = &getLastInstructionInBundle(E); assert(LastInst && "Failed to find last instruction in bundle"); // If the instruction is PHI, set the insert point after all the PHIs. bool IsPHI = isa(LastInst); @@ -9662,7 +9661,7 @@ Value *BoUpSLP::vectorizeOperand(TreeEntry *E, unsigned NodeIdx) { IRBuilder<>::InsertPointGuard Guard(Builder); if (E->getOpcode() != Instruction::InsertElement && E->getOpcode() != Instruction::PHI) { - Instruction *LastInst = EntryToLastInstruction.lookup(E); + Instruction *LastInst = &getLastInstructionInBundle(E); assert(LastInst && "Failed to find last instruction in bundle"); Builder.SetInsertPoint(LastInst); } @@ -10682,18 +10681,6 @@ Value *BoUpSLP::vectorizeTree( scheduleBlock(BSIter.second.get()); } - // Pre-gather last instructions. - for (const std::unique_ptr &E : VectorizableTree) { - if ((E->State == TreeEntry::NeedToGather && - (!E->getMainOp() || E->Idx > 0)) || - (E->State != TreeEntry::NeedToGather && - E->getOpcode() == Instruction::ExtractValue) || - E->getOpcode() == Instruction::InsertElement) - continue; - Instruction *LastInst = &getLastInstructionInBundle(E.get()); - EntryToLastInstruction.try_emplace(E.get(), LastInst); - } - Builder.SetInsertPoint(ReductionRoot ? ReductionRoot : &F->getEntryBlock().front()); auto *VectorRoot = vectorizeTree(VectorizableTree[0].get()); -- 2.7.4