namespace
{
// Number of elements processed per iteration; used as the Steps(...) argument
// when the kernel execution window is computed via calculate_max_window.
-constexpr unsigned int num_elems_processed_per_iteration = 16;
+constexpr unsigned int num_elems_processed_per_iteration = 1;
Status validate_arguments(const ITensorInfo *input1, const ITensorInfo *input2,
const ITensorInfo *output)
static_cast<cl::Kernel>(CLKernelLibraryEx::get().create_kernel(kernel_name, build_opts));
// Configure kernel window
- const unsigned int num_elems_processed_per_iteration = 1;
Window win = calculate_max_window(*input2->info(), Steps(num_elems_processed_per_iteration));
output->info()->set_valid_region(ValidRegion(Coordinates(), output->info()->tensor_shape()));