[AMDGPU] Only count global-to-global as indirect accesses

author Jay Foad <jay.foad@amd.com>

Thu, 31 Mar 2022 12:39:02 +0000 (13:39 +0100)

committer Jay Foad <jay.foad@amd.com>

Fri, 1 Apr 2022 12:48:13 +0000 (13:48 +0100)
author Jay Foad <jay.foad@amd.com>
Thu, 31 Mar 2022 12:39:02 +0000 (13:39 +0100)
committer Jay Foad <jay.foad@amd.com>
Fri, 1 Apr 2022 12:48:13 +0000 (13:48 +0100)
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUPerfHintAnalysis.cpp b/llvm/lib/Target/AMDGPU/AMDGPUPerfHintAnalysis.cpp

index de97b76..b994b53 100644 (file)
--- a/llvm/lib/Target/AMDGPU/AMDGPUPerfHintAnalysis.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUPerfHintAnalysis.cpp
@@ -153,7 +153,7 @@ bool AMDGPUPerfHint::isIndirectAccess(const Instruction *Inst) const {
  
      if (auto LD = dyn_cast<LoadInst>(V)) {
        auto M = LD->getPointerOperand();
-      if (isGlobalAddr(M) || isLocalAddr(M) || isConstantAddr(M)) {
+      if (isGlobalAddr(M)) {
          LLVM_DEBUG(dbgs() << "    is IA\n");
          return true;
        }
diff --git a/llvm/test/CodeGen/AMDGPU/perfhint.ll b/llvm/test/CodeGen/AMDGPU/perfhint.ll

index 2fe01e8..296eeab 100644 (file)
--- a/llvm/test/CodeGen/AMDGPU/perfhint.ll
+++ b/llvm/test/CodeGen/AMDGPU/perfhint.ll
@@ -75,10 +75,9 @@ bb:
    ret void
  }
  
-; FIXME: This test was intended to be WaveLimiterHint : 0
  ; GCN-LABEL: {{^}}test_indirect_through_phi:
  ; GCN: MemoryBound: 0
-; GCN: WaveLimiterHint : 1
+; GCN: WaveLimiterHint : 0
  define amdgpu_kernel void @test_indirect_through_phi(float addrspace(1)* %arg) {
  bb:
    %load = load float, float addrspace(1)* %arg, align 8
diff --git a/llvm/test/CodeGen/AMDGPU/schedule-regpressure-limit2.ll b/llvm/test/CodeGen/AMDGPU/schedule-regpressure-limit2.ll

index d8dac0b..e209f9e 100644 (file)
--- a/llvm/test/CodeGen/AMDGPU/schedule-regpressure-limit2.ll
+++ b/llvm/test/CodeGen/AMDGPU/schedule-regpressure-limit2.ll
@@ -6,8 +6,8 @@
  ; SI-MINREG: NumSgprs: {{[1-9]$}}
  ; SI-MINREG: NumVgprs: {{[1-9]$}}
  
-; SI-MAXOCC: NumSgprs: {{[0-4][0-9]$}}
-; SI-MAXOCC: NumVgprs: {{[0-4][0-9]$}}
+; SI-MAXOCC: NumSgprs: {{[1-4]?[0-9]$}}
+; SI-MAXOCC: NumVgprs: {{[1-4]?[0-9]$}}
  
  ; stores may alias loads
  ; VI: NumSgprs: {{[0-9]$}}
author	Jay Foad <jay.foad@amd.com>
	Thu, 31 Mar 2022 12:39:02 +0000 (13:39 +0100)
committer	Jay Foad <jay.foad@amd.com>
	Fri, 1 Apr 2022 12:48:13 +0000 (13:48 +0100)
llvm/lib/Target/AMDGPU/AMDGPUPerfHintAnalysis.cpp		patch | blob | history
llvm/test/CodeGen/AMDGPU/perfhint.ll		patch | blob | history
llvm/test/CodeGen/AMDGPU/schedule-regpressure-limit2.ll		patch | blob | history