W start = (tid == 0)? (W)0:sbuf[start_idx];\r
W end = sbuf[end_idx];\r
\r
- if (blockIdx.x == 0)\r
- printf("%d~~~~~~~~ start_idx %d, end_idx %d, start %f, end %f\n",\r
- tid, start_idx, end_idx, start, end);\r
-\r
dst(y, out_stride + tid) = (end - start);\r
}\r
}\r
W start = (tid == 0)? (W)0:sbuf[start_idx];\r
W end = sbuf[end_idx];\r
\r
- if (blockIdx.x == 0)\r
- printf("!!!!!!!!%d~~~~~~~~ start_idx %d, end_idx %d, start %f, end %f\n",\r
- tid, start_idx, end_idx, start, end);\r
-\r
dst(out_stride + tid, x) = saturate_cast<T>((end - start) * scale);\r
}\r
}\r
int thred_lines = divUp(src.cols, input_stride * iscale_x);\r
int blocks = src.rows * thred_lines;\r
\r
- printf("device code executed for X coordinate with:\nsize %d warps %d, threads %d, thred_lines %d, blocks %d input strude %d\n",\r
- src.cols, warps, threads, thred_lines, blocks, input_stride * iscale_x);\r
-\r
typedef typename scan_traits<T>::scan_line_type smem_type;\r
\r
resise_scan_fast_x<T, smem_type><<<blocks, threads, warps * 32 * sizeof(smem_type)>>>\r
thred_lines = divUp(src.rows, input_stride * iscale_y);\r
blocks = dst.cols * thred_lines;\r
\r
- printf("device code executed for Y coordinate with:\nsize %d warps %d, threads %d, thred_lines %d, blocks %d\n",\r
- dst.rows, warps, threads, thred_lines, blocks);\r
-\r
resise_scan_fast_y<T, smem_type><<<blocks, threads, warps * 32 * sizeof(smem_type)>>>\r
(buffer, dst, iscale_x, iscale_y, thred_lines, input_stride * iscale_y);\r
\r