[update] GPU FC layer updated with latest pipeline changes
author: Debadri Samaddar <s.debadri@samsung.com>
Mon, 7 Oct 2024 06:29:27 +0000 (11:59 +0530)
committer: Jijoong Moon <jijoong.moon@samsung.com>
Mon, 14 Oct 2024 07:34:01 +0000 (16:34 +0900)
Removed cl_context dependencies from fc_layer_cl.
Modified blas function calls accordingly.

Signed-off-by: Debadri Samaddar <s.debadri@samsung.com>
nntrainer/cl_context.cpp
nntrainer/layers/cl_layers/fc_layer_cl.cpp
nntrainer/layers/cl_layers/meson.build

index 821a32d6fa17de2006f813da154d5c7363a9c38f..f32c8301d9381ff1fb0c6bd482725746394c251d 100644 (file)
@@ -31,9 +31,9 @@ std::once_flag global_cl_context_init_flag;
 
 static void add_default_object(ClContext &cc) {
 
-  // cc.registerFactory(nntrainer::createLayer<FullyConnectedLayerCl>,
-  //                    FullyConnectedLayerCl::type,
-  //                    ml::train::LayerType::LAYER_FC);
+  cc.registerFactory(nntrainer::createLayer<FullyConnectedLayerCl>,
+                     FullyConnectedLayerCl::type,
+                     ml::train::LayerType::LAYER_FC);
 
   // cc.registerFactory(nntrainer::createLayer<AdditionLayerCL>,
   //                    AdditionLayerCL::type,
index 0e3cb178f0433fe28df7e63d368937741233ba86..adcd940300dcaff3681297267ea4245d8cf5e158 100644 (file)
@@ -127,9 +127,9 @@ void FullyConnectedLayerCl::forwarding(RunLayerContext &context,
     // Dequantize is currently disabled
     // weight.dequantize(weight_, axis);
 
-    dotCl(input_, weight_, hidden_, context);
+    dotCl(input_, weight_, hidden_);
   } else {
-    dotCl(input_, weight, hidden_, context);
+    dotCl(input_, weight, hidden_);
   }
 
   if (auto &disable_bias = std::get<props::DisableBias>(*layer_impl_props);
@@ -171,7 +171,7 @@ void FullyConnectedLayerCl::incremental_forwarding(RunLayerContext &context,
   Tensor input_step = input_.getSharedDataTensor(input_step_dim, 0, true);
   Tensor hidden_step = hidden_.getSharedDataTensor(hidden_step_dim, 0, true);
 
-  dotCl(input_step, weight, hidden_step, context);
+  dotCl(input_step, weight, hidden_step);
 
   if (auto &disable_bias = std::get<props::DisableBias>(*layer_impl_props);
       disable_bias.empty() || disable_bias.get() == false) {
index 906b8a85ac6f900d9044affc21f3982211f59a69..f9d740f00c3f7a3b620369533e6518bdf2cec81d 100644 (file)
@@ -1,5 +1,5 @@
 cl_layer_sources = [
-  # 'fc_layer_cl.cpp',
+    'fc_layer_cl.cpp',
   # 'addition_layer_cl.cpp',
   # 'swiglu_cl.cpp',
   # 'reshape_cl.cpp',