[bugfix/blas] Fixed sgemm_cl pointer check
author Debadri Samaddar <s.debadri@samsung.com>
Thu, 3 Oct 2024 09:32:08 +0000 (15:02 +0530)
committer Jijoong Moon <jijoong.moon@samsung.com>
Mon, 14 Oct 2024 07:33:44 +0000 (16:33 +0900)
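Fixed the failing condition in sgemm_cl, which checked `result` instead of the registered kernel pointer, and fixed the kernel argument passed to the DispatchCommand function call.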

Signed-off-by: Debadri Samaddar <s.debadri@samsung.com>
nntrainer/tensor/cl_operations/blas_kernels_fp16.cpp

index 18bbd8c7fbe7416f500439f18c3b96de154473f1..6aa7ccb6e23230b753d56217a34014fe2fc0fc28 100644 (file)
@@ -203,7 +203,7 @@ void sgemm_cl(bool TransA, bool TransB, const __fp16 *A, const __fp16 *B,
   do {
     ClContext::SharedPtrClKernel kernel_sgemm_fp16_ptr =
       cl_context_ref.registerClKernel(sgemm_cl_kernel_fp16_, kernel_func_);
-    if (!result) {
+    if (!kernel_sgemm_fp16_ptr) {
       break;
     }
 
@@ -278,7 +278,7 @@ void sgemm_cl(bool TransA, bool TransB, const __fp16 *A, const __fp16 *B,
     const int work_group_size[3] = {32, 32, 1}; // test-value
 
     result = cl_context_ref.command_queue_inst_.DispatchCommand(
-      *kernel_sgemm_fp16_ptr, work_groups_count, work_group_size);
+      kernel_sgemm_fp16_ptr, work_groups_count, work_group_size);
     if (!result) {
       break;
     }