--- /dev/null
+__kernel // Each work-item reads src[id], bumps it inside two bool-toggled nested loops, and stores the result in dst[id].
+void compiler_bool_cross_basic_block(__global int *src, // input buffer, read once at index id
+ __global int *dst, // output buffer, written once at index id
+ int scale){ // upper bound used by both the outer and the inner loop
+ int id = (int)get_global_id(0); // this work-item's index in dimension 0
+
+ bool isRedRow = false; // flipped after every outer iteration, so it is true when i is odd
+ bool isRed; // assigned before each inner loop and only read inside that loop
+ int val = src[id];
+ for (unsigned int i=0; i<scale; i++, isRedRow = !isRedRow) { // NOTE: i is unsigned and scale is int, so this comparison is performed as unsigned
+ if (isRedRow) {
+ isRed= false; // restart the column toggle for every selected row
+ for (unsigned int j=0; j < scale; j++, isRed=!isRed) { // isRed flips each inner iteration, so it is true when j is odd
+ if (isRed) {
+ val++; // reached only when both i and j are odd
+ }
+ }
+ }
+ }
+ dst[id] = val;
+}
compiler_insn_selection_min.cpp
compiler_insn_selection_max.cpp
compiler_insn_selection_masked_min_max.cpp
- compiler_load_bool_imm.cpp
+ compiler_load_bool_imm.cpp
compiler_global_memory_barrier.cpp
compiler_local_memory_two_ptr.cpp
compiler_local_memory_barrier.cpp
builtin_acos_asin.cpp
runtime_createcontext.cpp
runtime_null_kernel_arg.cpp
- runtime_event.cpp
+ runtime_event.cpp
compiler_double.cpp
compiler_double_2.cpp
compiler_double_3.cpp
compiler_long_asr.cpp
compiler_long_mult.cpp
compiler_long_cmp.cpp
+ #compiler_bool_cross_basic_block.cpp
utest_assert.cpp
utest.cpp
utest_file_map.cpp
--- /dev/null
+#include "utest_helper.hpp"
+
+static void cpu(int global_id, int *src, int *dst, int scale) { // Host reference for one index: same toggled nested loops as the kernel, reading src[global_id] and writing dst[global_id].
+ bool isRedRow = false; // flipped after every outer iteration, so it is true when i is odd
+ bool isRed; // assigned before each inner loop and only read inside that loop
+ int val = src[global_id];
+ for (int i=0; i<scale; i++, isRedRow = !isRedRow) { // signed counters here: a non-positive scale runs zero iterations
+ if (isRedRow) {
+ isRed= false; // restart the column toggle for every selected row
+ for (int j=0; j < scale; j++, isRed=!isRed) { // isRed flips each inner iteration, so it is true when j is odd
+ if (isRed) {
+ val++; // reached only when both i and j are odd
+ }
+ }
+ }
+ }
+ dst[global_id] = val;
+}
+
+void compiler_bool_cross_basic_block(void){ // Test body: fills an input buffer, runs the kernel, and asserts its output equals the cpu() reference element by element.
+ const size_t n = 16; // element count; matches the fixed size of the host arrays below
+ int cpu_dst[16], cpu_src[16]; // host-side copies used as input and output of cpu()
+ int scale = 4; // passed to the kernel as argument 2 and to cpu()
+
+ // Setup kernel and buffers
+ OCL_CREATE_KERNEL("compiler_bool_cross_basic_block");
+ OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(int), NULL); // bound below as kernel argument 0 (src); sized for n ints
+ OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(int), NULL); // bound below as kernel argument 1 (dst); sized for n ints
+ OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+ OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+ OCL_SET_ARG(2, sizeof(int), &scale);
+ globals[0] = 16; // presumably the global work size consumed by OCL_NDRANGE - macro not visible here
+ locals[0] = 16; // presumably the work-group size consumed by OCL_NDRANGE - macro not visible here
+
+ OCL_MAP_BUFFER(0); // buf_data[0] is dereferenced right after this; presumably the macro sets it up - confirm in utest_helper.hpp
+ for (int32_t i = 0; i < (int32_t) n; ++i)
+ cpu_src[i] = ((int*)buf_data[0])[i] = i; // store i in the mapped buffer and keep the same value in the host copy
+ OCL_UNMAP_BUFFER(0);
+
+ // Run the kernel on GPU
+ OCL_NDRANGE(1); // NOTE(review): the argument looks like the number of dimensions - confirm against the macro definition
+
+ // Run on CPU
+ for (int32_t i = 0; i < (int32_t) n; ++i)
+ cpu(i, cpu_src, cpu_dst, scale); // one call per index, mirroring one work-item each
+
+ // Compare
+ OCL_MAP_BUFFER(1);
+ for (int32_t i = 0; i < (int32_t) n; ++i)
+ OCL_ASSERT(((int *)buf_data[1])[i] == cpu_dst[i]); // kernel output must equal the host reference exactly
+ OCL_UNMAP_BUFFER(1);
+
+}
+
+
+MAKE_UTEST_FROM_FUNCTION(compiler_bool_cross_basic_block) // presumably registers the function above with the unit-test runner - macro defined elsewhere