Tensor3D input2 = CONVERT_TO_TENSOR3D_STRUCT(input2);
Tensor3D output = CONVERT_TO_TENSOR3D_STRUCT(output);
+ VEC_DATA_TYPE(DATA_TYPE, VEC_SIZE)
+ diff = VLOAD(VEC_SIZE)(0, (__global DATA_TYPE *)input1.ptr)- VLOAD(VEC_SIZE)(0, (__global DATA_TYPE *)input2.ptr);
+
+ VEC_DATA_TYPE(DATA_TYPE, VEC_SIZE)
+ sq_diff = diff * diff;
+
VSTORE(VEC_SIZE)
- (pow(VLOAD(VEC_SIZE)(0, (__global DATA_TYPE *)input1.ptr) - VLOAD(VEC_SIZE)(0, (__global DATA_TYPE *)input2.ptr), 2),
- 0, (__global DATA_TYPE *)output.ptr);
+ (sq_diff, 0, (__global DATA_TYPE *)output.ptr);
}