add utest compiler_overflow for llvm intrinsic function.
authorLuo Xionghu <xionghu.luo@intel.com>
Mon, 27 Oct 2014 03:14:50 +0000 (11:14 +0800)
committerZhigang Gong <zhigang.gong@intel.com>
Tue, 28 Oct 2014 02:14:46 +0000 (10:14 +0800)
this case only runs for uadd_with_over_flow function so far.

Signed-off-by: Luo Xionghu <xionghu.luo@intel.com>
Reviewed-by: Zhigang Gong <zhigang.gong@linux.intel.com>
kernels/compiler_overflow.cl [new file with mode: 0644]
utests/CMakeLists.txt
utests/compiler_overflow.cpp [new file with mode: 0644]

diff --git a/kernels/compiler_overflow.cl b/kernels/compiler_overflow.cl
new file mode 100644 (file)
index 0000000..75ed5ce
--- /dev/null
@@ -0,0 +1,20 @@
+#define COMPILER_OVERFLOW(TYPE) \
+    kernel void compiler_overflow_##TYPE (global TYPE* src, global TYPE* dst)   \
+{                                                \
+  __global TYPE* A = &src[get_global_id(0)];    \
+  TYPE B = 1; \
+  *A += B;    \
+  TYPE carry = -convert_##TYPE((*A) < B); \
+               \
+  (*A).y += carry.x;  \
+  carry.y += ((*A).y < carry.x); \
+  (*A).z += carry.y;   \
+    \
+  carry.z += ((*A).z < carry.y); \
+  (*A).w += carry.z; \
+   dst[get_global_id(0)] = src[get_global_id(0)]; \
+}
+
+COMPILER_OVERFLOW(uint4)
+COMPILER_OVERFLOW(ushort4)
+COMPILER_OVERFLOW(uchar4)
index cf3addc..bd1c65f 100644 (file)
@@ -104,6 +104,7 @@ set (utests_sources
   compiler_write_only.cpp
   compiler_write_only_shorts.cpp
   compiler_switch.cpp
+  compiler_overflow.cpp
   compiler_math.cpp
   compiler_atomic_functions.cpp
   compiler_async_copy.cpp
diff --git a/utests/compiler_overflow.cpp b/utests/compiler_overflow.cpp
new file mode 100644 (file)
index 0000000..1d3f53d
--- /dev/null
@@ -0,0 +1,72 @@
+#include "utest_helper.hpp"
+
+namespace {
+
+typedef struct {
+  uint32_t x;
+  uint32_t y;
+  uint32_t z;
+  uint32_t w;
+} uint4;
+
+typedef struct {
+  uint16_t x;
+  uint16_t y;
+  uint16_t z;
+  uint16_t w;
+} ushort4;
+
+typedef struct {
+  uint8_t x;
+  uint8_t y;
+  uint8_t z;
+  uint8_t w;
+} uchar4;
+
+template<typename T>
+void test(const char *kernel_name, int s_type)
+{
+  const size_t n = 16;
+
+  // Setup kernel and buffers
+  OCL_CREATE_KERNEL_FROM_FILE("compiler_overflow", kernel_name);
+  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(T), NULL);
+  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(T), NULL);
+  OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+
+  OCL_MAP_BUFFER(0);
+  for (uint32_t i = 0; i < n; ++i) {
+    ((T*)buf_data[0])[i].x = s_type?CL_INT_MAX:CL_UINT_MAX;
+    ((T*)buf_data[0])[i].y = s_type?CL_INT_MAX:CL_UINT_MAX;
+    ((T*)buf_data[0])[i].z = s_type?CL_INT_MAX:CL_UINT_MAX;
+    ((T*)buf_data[0])[i].w = i;
+  }
+  OCL_UNMAP_BUFFER(0);
+
+  globals[0] = n;
+  locals[0] = 16;
+  OCL_NDRANGE(1);
+
+  OCL_MAP_BUFFER(1);
+  for (uint32_t i = 0; i < 16; ++i) {
+    OCL_ASSERT(((T*)buf_data[1])[i].x == 0);
+    OCL_ASSERT(((T*)buf_data[1])[i].y == 1);
+    OCL_ASSERT(((T*)buf_data[1])[i].z == 1);
+    OCL_ASSERT(((T*)buf_data[1])[i].w == i+2);
+  }
+  OCL_UNMAP_BUFFER(1);
+}
+
+}
+
+#define compiler_overflow(type, kernel, s_type) \
+static void compiler_overflow_ ##type(void)\
+{\
+  test<type>(# kernel, s_type);\
+}\
+MAKE_UTEST_FROM_FUNCTION(compiler_overflow_ ## type);
+
+compiler_overflow(uint4, compiler_overflow_uint4, 0)
+compiler_overflow(ushort4, compiler_overflow_ushort4, 0)
+compiler_overflow(uchar4, compiler_overflow_uchar4, 0)