[X86] [AMX] Fix the test case failure caused by D107544.

author Bing1 Yu <bing1.yu@intel.com>

Wed, 18 Aug 2021 05:40:19 +0000 (13:40 +0800)

committer Bing1 Yu <bing1.yu@intel.com>

Wed, 18 Aug 2021 14:27:22 +0000 (22:27 +0800)
author Bing1 Yu <bing1.yu@intel.com>
Wed, 18 Aug 2021 05:40:19 +0000 (13:40 +0800)
committer Bing1 Yu <bing1.yu@intel.com>
Wed, 18 Aug 2021 14:27:22 +0000 (22:27 +0800)
diff --git a/llvm/lib/Target/X86/X86LowerAMXType.cpp b/llvm/lib/Target/X86/X86LowerAMXType.cpp

index a2bcc98..e150f2d 100644 (file)
--- a/llvm/lib/Target/X86/X86LowerAMXType.cpp
+++ b/llvm/lib/Target/X86/X86LowerAMXType.cpp
@@ -898,10 +898,12 @@ bool X86LowerAMXCast::combineAMXcast(TargetLibraryInfo *TLI) {
    Convert(Vec2TileInsts, Intrinsic::x86_cast_tile_to_vector);
    Convert(Tile2VecInsts, Intrinsic::x86_cast_vector_to_tile);
  
-  auto EraseInst = [](SmallVectorImpl<Instruction *> &Insts) {
+  auto EraseInst = [&](SmallVectorImpl<Instruction *> &Insts) {
      for (auto *Inst : Insts) {
-      if (Inst->use_empty())
+      if (Inst->use_empty()) {
          Inst->eraseFromParent();
+        Change = true;
+      }
      }
    };
  
@@ -912,7 +914,7 @@ bool X86LowerAMXCast::combineAMXcast(TargetLibraryInfo *TLI) {
    for (BasicBlock &BB : Func) {
      for (Instruction &I : BB) {
        if (isAMXCast(&I)) {
-        if (PHINode *PN = dyn_cast<PHINode>(I.getOperand(0)))
+        if (isa<PHINode>(I.getOperand(0)))
            PhiCastWorkList.push_back(&I);
        }
      }
@@ -1036,17 +1038,18 @@ public:
    }
  
    bool runOnFunction(Function &F) override {
+    bool C = false;
      TargetMachine *TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();
      TargetLibraryInfo *TLI =
          &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);
      X86LowerAMXCast LAC(F);
-    LAC.combineAMXcast(TLI);
+    C |= LAC.combineAMXcast(TLI);
      // There might be remaining AMXcast after combineAMXcast and they should be
      // handled elegantly.
-    LAC.transformAllAMXCast();
+    C |= LAC.transformAllAMXCast();
  
      X86LowerAMXType LAT(F);
-    bool C = LAT.visit();
+    C |= LAT.visit();
  
      // Prepare for fast register allocation at O0.
      // Todo: May better check the volatile model of AMX code, not just
author	Bing1 Yu <bing1.yu@intel.com>
	Wed, 18 Aug 2021 05:40:19 +0000 (13:40 +0800)
committer	Bing1 Yu <bing1.yu@intel.com>
	Wed, 18 Aug 2021 14:27:22 +0000 (22:27 +0800)