[AMDGPU] Add CL option for max-ilp scheduler.

author Austin Kerbow <Austin.Kerbow@amd.com>

Tue, 2 Aug 2022 21:15:00 +0000 (14:15 -0700)

committer Austin Kerbow <Austin.Kerbow@amd.com>

Tue, 2 Aug 2022 23:52:14 +0000 (16:52 -0700)
author Austin Kerbow <Austin.Kerbow@amd.com>
Tue, 2 Aug 2022 21:15:00 +0000 (14:15 -0700)
committer Austin Kerbow <Austin.Kerbow@amd.com>
Tue, 2 Aug 2022 23:52:14 +0000 (16:52 -0700)
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp

index 643eb0b..103a72b 100644 (file)
--- a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp
@@ -327,6 +327,11 @@ static cl::opt<bool> EnablePromoteKernelArguments(
      cl::desc("Enable promotion of flat kernel pointer arguments to global"),
      cl::Hidden, cl::init(true));
  
      cl::desc("Enable promotion of flat kernel pointer arguments to global"),
      cl::Hidden, cl::init(true));
  
+static cl::opt<bool> EnableMaxIlpSchedStrategy(
+    "amdgpu-enable-max-ilp-scheduling-strategy",
+    cl::desc("Enable scheduling strategy to maximize ILP for a single wave."),
+    cl::Hidden, cl::init(false));
+
  extern "C" LLVM_EXTERNAL_VISIBILITY void LLVMInitializeAMDGPUTarget() {
    // Register the target
    RegisterTargetMachine<R600TargetMachine> X(getTheAMDGPUTarget());
  extern "C" LLVM_EXTERNAL_VISIBILITY void LLVMInitializeAMDGPUTarget() {
    // Register the target
    RegisterTargetMachine<R600TargetMachine> X(getTheAMDGPUTarget());
@@ -1161,6 +1166,10 @@ ScheduleDAGInstrs *GCNPassConfig::createMachineScheduler(
    const GCNSubtarget &ST = C->MF->getSubtarget<GCNSubtarget>();
    if (ST.enableSIScheduler())
      return createSIMachineScheduler(C);
    const GCNSubtarget &ST = C->MF->getSubtarget<GCNSubtarget>();
    if (ST.enableSIScheduler())
      return createSIMachineScheduler(C);
+
+  if (EnableMaxIlpSchedStrategy)
+    return createGCNMaxILPMachineScheduler(C);
+
    return createGCNMaxOccupancyMachineScheduler(C);
  }
  
    return createGCNMaxOccupancyMachineScheduler(C);
  }
  
diff --git a/llvm/test/CodeGen/AMDGPU/schedule-ilp.ll b/llvm/test/CodeGen/AMDGPU/schedule-ilp.ll

index ea5062c..52fa123 100644 (file)
--- a/llvm/test/CodeGen/AMDGPU/schedule-ilp.ll
+++ b/llvm/test/CodeGen/AMDGPU/schedule-ilp.ll
@@ -1,5 +1,6 @@
  ; RUN: llc -march=amdgcn -mcpu=tonga -misched=gcn-iterative-ilp -verify-machineinstrs < %s | FileCheck %s
  ; RUN: llc -march=amdgcn -mcpu=tonga -misched=gcn-max-ilp -verify-machineinstrs < %s | FileCheck %s
  ; RUN: llc -march=amdgcn -mcpu=tonga -misched=gcn-iterative-ilp -verify-machineinstrs < %s | FileCheck %s
  ; RUN: llc -march=amdgcn -mcpu=tonga -misched=gcn-max-ilp -verify-machineinstrs < %s | FileCheck %s
+; RUN: llc -march=amdgcn -mcpu=tonga -amdgpu-enable-max-ilp-scheduling-strategy -verify-machineinstrs < %s | FileCheck %s
  
  ; CHECK: NumVgprs: {{[0-9][0-9][0-9]$}}
  
  
  ; CHECK: NumVgprs: {{[0-9][0-9][0-9]$}}
author	Austin Kerbow <Austin.Kerbow@amd.com>
	Tue, 2 Aug 2022 21:15:00 +0000 (14:15 -0700)
committer	Austin Kerbow <Austin.Kerbow@amd.com>
	Tue, 2 Aug 2022 23:52:14 +0000 (16:52 -0700)
llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp		patch | blob | history
llvm/test/CodeGen/AMDGPU/schedule-ilp.ll		patch | blob | history