--- /dev/null
+/*
+ * Element-wise halving add: each work-item reads one int from src1 and one
+ * from src2 at its global id (dimension 0) and stores hadd() of the pair
+ * into dst at the same index.
+ */
+kernel void compiler_hadd(global int *src1, global int *src2, global int *dst) {
+  const int gid = get_global_id(0);
+  const int lhs = src1[gid];
+  const int rhs = src2[gid];
+  dst[gid] = hadd(lhs, rhs);
+}
--- /dev/null
+/*
+ * Element-wise rounding halving add: each work-item reads one int from src1
+ * and one from src2 at its global id (dimension 0) and stores rhadd() of the
+ * pair into dst at the same index.
+ */
+kernel void compiler_rhadd(global int *src1, global int *src2, global int *dst) {
+  const int gid = get_global_id(0);
+  const int lhs = src1[gid];
+  const int rhs = src2[gid];
+  dst[gid] = rhadd(lhs, rhs);
+}
compiler_global_constant.cpp
compiler_global_constant_2.cpp
compiler_group_size.cpp
+ compiler_hadd.cpp
compiler_if_else.cpp
compiler_integer_division.cpp
compiler_integer_remainder.cpp
compiler_lower_return1.cpp
compiler_lower_return2.cpp
compiler_multiple_kernels.cpp
+ compiler_rhadd.cpp
compiler_rotate.cpp
compiler_saturate.cpp
compiler_saturate_sub.cpp
--- /dev/null
+#include "utest_helper.hpp"
+
+/*
+ * Unit test for the "compiler_hadd" kernel.
+ *
+ * Fills two n-element int buffers with rand() values (keeping a host-side
+ * copy of each), runs the kernel, then checks every output element against
+ * (src1 + src2) >> 1 evaluated on the host in 64-bit arithmetic.
+ */
+void compiler_hadd(void)
+{
+  const int n = 32;
+  int src1[n];  // host copy of the first operand
+  int src2[n];  // host copy of the second operand
+
+  // Kernel, two input buffers (0, 1) and one output buffer (2)
+  OCL_CREATE_KERNEL("compiler_hadd");
+  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(int), NULL);
+  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(int), NULL);
+  OCL_CREATE_BUFFER(buf[2], 0, n * sizeof(int), NULL);
+  OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+  OCL_SET_ARG(2, sizeof(cl_mem), &buf[2]);
+
+  // Generate the operands; rand() is drawn for src1 first, then src2,
+  // once per element.
+  OCL_MAP_BUFFER(0);
+  OCL_MAP_BUFFER(1);
+  int *in1 = (int*)buf_data[0];
+  int *in2 = (int*)buf_data[1];
+  for (int k = 0; k < n; ++k) {
+    const int v1 = rand();
+    in1[k] = v1;
+    src1[k] = v1;
+    const int v2 = rand();
+    in2[k] = v2;
+    src2[k] = v2;
+  }
+  OCL_UNMAP_BUFFER(0);
+  OCL_UNMAP_BUFFER(1);
+
+  // Launch in one dimension; globals/locals are presumably the global and
+  // local work sizes consumed by OCL_NDRANGE (defined in utest_helper.hpp).
+  globals[0] = n;
+  locals[0] = 16;
+  OCL_NDRANGE(1);
+
+  // Compare against a reference computed in long long so the sum of two
+  // ints cannot overflow before the shift.
+  OCL_MAP_BUFFER(2);
+  for (int i = 0; i < n; ++i) {
+    long long a = ((long long)src1[i] + src2[i]) >> 1;
+    OCL_ASSERT(((int*)buf_data[2])[i] == (int)a);
+  }
+  OCL_UNMAP_BUFFER(2);
+}
+
+// Register the function with the unit-test framework.
+MAKE_UTEST_FROM_FUNCTION(compiler_hadd);
--- /dev/null
+#include "utest_helper.hpp"
+
+/*
+ * Unit test for the "compiler_rhadd" kernel.
+ *
+ * Fills two n-element int buffers with rand() values (keeping a host-side
+ * copy of each), runs the kernel, then checks every output element against
+ * (src1 + src2 + 1) >> 1 evaluated on the host in 64-bit arithmetic.
+ */
+void compiler_rhadd(void)
+{
+  const int n = 32;
+  int src1[n];  // host copy of the first operand
+  int src2[n];  // host copy of the second operand
+
+  // Kernel, two input buffers (0, 1) and one output buffer (2)
+  OCL_CREATE_KERNEL("compiler_rhadd");
+  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(int), NULL);
+  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(int), NULL);
+  OCL_CREATE_BUFFER(buf[2], 0, n * sizeof(int), NULL);
+  OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+  OCL_SET_ARG(2, sizeof(cl_mem), &buf[2]);
+
+  // Generate the operands; rand() is drawn for src1 first, then src2,
+  // once per element.
+  OCL_MAP_BUFFER(0);
+  OCL_MAP_BUFFER(1);
+  int *in1 = (int*)buf_data[0];
+  int *in2 = (int*)buf_data[1];
+  for (int k = 0; k < n; ++k) {
+    const int v1 = rand();
+    in1[k] = v1;
+    src1[k] = v1;
+    const int v2 = rand();
+    in2[k] = v2;
+    src2[k] = v2;
+  }
+  OCL_UNMAP_BUFFER(0);
+  OCL_UNMAP_BUFFER(1);
+
+  // Launch in one dimension; globals/locals are presumably the global and
+  // local work sizes consumed by OCL_NDRANGE (defined in utest_helper.hpp).
+  globals[0] = n;
+  locals[0] = 16;
+  OCL_NDRANGE(1);
+
+  // Compare against a reference computed in long long so neither the sum
+  // nor the +1 rounding term can overflow before the shift.
+  OCL_MAP_BUFFER(2);
+  for (int i = 0; i < n; ++i) {
+    long long a = ((long long)src1[i] + src2[i] + 1) >> 1;
+    OCL_ASSERT(((int*)buf_data[2])[i] == (int)a);
+  }
+  OCL_UNMAP_BUFFER(2);
+}
+
+// Register the function with the unit-test framework.
+MAKE_UTEST_FROM_FUNCTION(compiler_rhadd);