radeon/llvm: Run standard optimization passes on conpute shader modules 34/6634/1
authorTom Stellard <thomas.stellard@amd.com>
Tue, 14 May 2013 15:56:25 +0000 (08:56 -0700)
committerTom Stellard <thomas.stellard@amd.com>
Fri, 17 May 2013 14:38:01 +0000 (07:38 -0700)
The SROA and function inliner passes are espically important, because
they optimize away unsupported features: functions and indirect
private memory access.

src/gallium/drivers/radeon/radeon_llvm_util.c

index e3b0d63..25be245 100644 (file)
@@ -29,6 +29,7 @@
 
 #include <llvm-c/BitReader.h>
 #include <llvm-c/Core.h>
+#include <llvm-c/Transforms/PassManagerBuilder.h>
 
 LLVMModuleRef radeon_llvm_parse_bitcode(const unsigned char * bitcode,
                                                        unsigned bitcode_len)
@@ -50,6 +51,19 @@ unsigned radeon_llvm_get_num_kernels(const unsigned char *bitcode,
        return LLVMGetNamedMetadataNumOperands(mod, "opencl.kernels");
 }
 
+static void radeon_llvm_optimize(LLVMModuleRef mod)
+{
+       LLVMPassManagerBuilderRef builder = LLVMPassManagerBuilderCreate();
+       LLVMPassManagerRef pass_manager = LLVMCreatePassManager();
+
+       LLVMPassManagerBuilderUseInlinerWithThreshold(builder, 1000000000);
+       LLVMPassManagerBuilderPopulateModulePassManager(builder, pass_manager);
+
+       LLVMRunPassManager(pass_manager, mod);
+       LLVMPassManagerBuilderDispose(builder);
+       LLVMDisposePassManager(pass_manager);
+}
+
 LLVMModuleRef radeon_llvm_get_kernel_module(unsigned index,
                const unsigned char *bitcode, unsigned bitcode_len)
 {
@@ -72,5 +86,6 @@ LLVMModuleRef radeon_llvm_get_kernel_module(unsigned index,
                LLVMDeleteFunction(kernel_function);
        }
        FREE(kernel_metadata);
+       radeon_llvm_optimize(mod);
        return mod;
 }