diff options
author | Homer Hsing <homer.xing@intel.com> | 2013-02-01 13:48:59 +0800 |
---|---|---|
committer | Zhigang Gong <zhigang.gong@linux.intel.com> | 2013-04-10 14:52:32 +0800 |
commit | a985f4e11b21bb3fd2506a4b56c7f06891dbdd16 (patch) | |
tree | 90dd7213d99e944dd78f9a75e94ea075dc2c4216 /utests | |
parent | b3e9efd931ce0aa76cdf1480d1b685a5bcae695f (diff) |
Make "logical shift right" work
Before this fix, "logical shift right" produced a wrong result (the sign bit was propagated, as an arithmetic shift would do):
(0xFF000000U >> 24) == 0xFFFFFFFF
After this fix, the result is correct:
(0xFF000000U >> 24) == 0xFF
Also add a test case that checks 128 random inputs (8 passes of 16 values each).
This patch fixes the "component_transfer_linear" filter.
Signed-off-by: Homer Hsing <homer.xing@intel.com>
Reviewed-by: Zhigang Gong <zhigang.gong@linux.intel.com>
Tested-by: Zhigang Gong <zhigang.gong@linux.intel.com>
Diffstat (limited to 'utests')
-rw-r--r-- | utests/CMakeLists.txt | 1 | ||||
-rw-r--r-- | utests/compiler_shift_right.cpp | 45 |
2 files changed, 46 insertions, 0 deletions
diff --git a/utests/CMakeLists.txt b/utests/CMakeLists.txt
index a5992410..c67cf341 100644
--- a/utests/CMakeLists.txt
+++ b/utests/CMakeLists.txt
@@ -37,6 +37,7 @@ ADD_LIBRARY(utests SHARED
                compiler_multiple_kernels.cpp
                compiler_saturate.cpp
                compiler_saturate_sub.cpp
+               compiler_shift_right.cpp
                compiler_short_scatter.cpp
                compiler_sub_bytes.cpp
                compiler_sub_shorts.cpp
diff --git a/utests/compiler_shift_right.cpp b/utests/compiler_shift_right.cpp
new file mode 100644
index 00000000..b94cc462
--- /dev/null
+++ b/utests/compiler_shift_right.cpp
@@ -0,0 +1,45 @@
+#include "utest_helper.hpp"
+
+typedef unsigned int uint;
+
+static void cpu(int global_id, uint *src, int *dst) {
+  dst[global_id] = src[global_id] >> 24;
+}
+
+void compiler_shift_right(void)
+{
+  const size_t n = 16;
+  uint cpu_src[16];
+  int cpu_dst[16];
+
+  // Setup kernel and buffers
+  OCL_CREATE_KERNEL("compiler_shift_right");
+  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(uint), NULL);
+  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(int), NULL);
+  OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+  globals[0] = 16;
+  locals[0] = 16;
+
+  // Run random tests
+  for (uint32_t pass = 0; pass < 8; ++pass) {
+    OCL_MAP_BUFFER(0);
+    for (int32_t i = 0; i < (int32_t) n; ++i)
+      cpu_src[i] = ((uint*)buf_data[0])[i] = 0x80000000 | rand();
+    OCL_UNMAP_BUFFER(0);
+
+    // Run the kernel on GPU
+    OCL_NDRANGE(1);
+
+    // Run on CPU
+    for (int32_t i = 0; i < (int32_t) n; ++i) cpu(i, cpu_src, cpu_dst);
+
+    // Compare
+    OCL_MAP_BUFFER(1);
+    for (int32_t i = 0; i < (int32_t) n; ++i)
+      OCL_ASSERT(((int *)buf_data[1])[i] == cpu_dst[i]);
+    OCL_UNMAP_BUFFER(1);
+  }
+}
+
+MAKE_UTEST_FROM_FUNCTION(compiler_shift_right);