From e230d9debbd4c2e715f50059a02d502d90a626d7 Mon Sep 17 00:00:00 2001 From: Tom Stellard Date: Tue, 14 May 2013 08:56:25 -0700 Subject: [PATCH] radeon/llvm: Run standard optimization passes on compute shader modules The SROA and function inliner passes are especially important, because they optimize away unsupported features: functions and indirect private memory access. --- src/gallium/drivers/radeon/radeon_llvm_util.c | 15 +++++++++++++++ 1 file changed, 15 insertions(+) diff --git a/src/gallium/drivers/radeon/radeon_llvm_util.c b/src/gallium/drivers/radeon/radeon_llvm_util.c index e3b0d63..25be245 100644 --- a/src/gallium/drivers/radeon/radeon_llvm_util.c +++ b/src/gallium/drivers/radeon/radeon_llvm_util.c @@ -29,6 +29,7 @@ #include <llvm-c/BitReader.h> #include <llvm-c/Core.h> +#include <llvm-c/Transforms/PassManagerBuilder.h> LLVMModuleRef radeon_llvm_parse_bitcode(const unsigned char * bitcode, unsigned bitcode_len) @@ -50,6 +51,19 @@ unsigned radeon_llvm_get_num_kernels(const unsigned char *bitcode, return LLVMGetNamedMetadataNumOperands(mod, "opencl.kernels"); } +static void radeon_llvm_optimize(LLVMModuleRef mod) +{ + LLVMPassManagerBuilderRef builder = LLVMPassManagerBuilderCreate(); + LLVMPassManagerRef pass_manager = LLVMCreatePassManager(); + + LLVMPassManagerBuilderUseInlinerWithThreshold(builder, 1000000000); + LLVMPassManagerBuilderPopulateModulePassManager(builder, pass_manager); + + LLVMRunPassManager(pass_manager, mod); + LLVMPassManagerBuilderDispose(builder); + LLVMDisposePassManager(pass_manager); +} + LLVMModuleRef radeon_llvm_get_kernel_module(unsigned index, const unsigned char *bitcode, unsigned bitcode_len) { @@ -72,5 +86,6 @@ LLVMModuleRef radeon_llvm_get_kernel_module(unsigned index, LLVMDeleteFunction(kernel_function); } FREE(kernel_metadata); + radeon_llvm_optimize(mod); return mod; } -- 2.7.4