2 // Copyright © 2017 Arm Ltd. All rights reserved.
3 // SPDX-License-Identifier: MIT
6 #include <armnn/test/CreateWorkload.hpp>
8 #include <backends/CpuTensorHandle.hpp>
9 #include <backends/reference/RefWorkloadFactory.hpp>
10 #include <backends/reference/workloads/RefWorkloads.hpp>
15 template<typename Workload>
16 void CheckInputOutput(std::unique_ptr<Workload> workload, const TensorInfo& inputInfo, const TensorInfo& outputInfo)
18 auto queueDescriptor = workload->GetData();
19 auto inputHandle = boost::polymorphic_downcast<ConstCpuTensorHandle*>(queueDescriptor.m_Inputs[0]);
20 auto outputHandle = boost::polymorphic_downcast<CpuTensorHandle*>(queueDescriptor.m_Outputs[0]);
21 BOOST_TEST((inputHandle->GetTensorInfo() == inputInfo));
22 BOOST_TEST((outputHandle->GetTensorInfo() == outputInfo));
25 template <typename Workload>
26 void CheckInputsOutput(std::unique_ptr<Workload> workload,
27 const TensorInfo& inputInfo0,
28 const TensorInfo& inputInfo1,
29 const TensorInfo& outputInfo)
31 auto queueDescriptor = workload->GetData();
32 auto inputHandle0 = boost::polymorphic_downcast<ConstCpuTensorHandle*>(queueDescriptor.m_Inputs[0]);
33 auto inputHandle1 = boost::polymorphic_downcast<ConstCpuTensorHandle*>(queueDescriptor.m_Inputs[1]);
34 auto outputHandle = boost::polymorphic_downcast<CpuTensorHandle*>(queueDescriptor.m_Outputs[0]);
35 BOOST_TEST((inputHandle0->GetTensorInfo() == inputInfo0));
36 BOOST_TEST((inputHandle1->GetTensorInfo() == inputInfo1));
37 BOOST_TEST((outputHandle->GetTensorInfo() == outputInfo));
41 BOOST_AUTO_TEST_SUITE(CreateWorkloadRef)
43 template <typename ActivationWorkloadType, armnn::DataType DataType>
44 static void RefCreateActivationWorkloadTest()
47 RefWorkloadFactory factory;
48 auto workload = CreateActivationWorkloadTest<ActivationWorkloadType, DataType>(factory, graph);
50 // Checks that outputs are as we expect them (see definition of CreateActivationWorkloadTest).
51 CheckInputOutput(std::move(workload),
52 TensorInfo({ 1, 1 }, DataType),
53 TensorInfo({ 1, 1 }, DataType));
56 BOOST_AUTO_TEST_CASE(CreateActivationFloat32Workload)
58 RefCreateActivationWorkloadTest<RefActivationFloat32Workload, armnn::DataType::Float32>();
61 BOOST_AUTO_TEST_CASE(CreateActivationUint8Workload)
63 RefCreateActivationWorkloadTest<RefActivationUint8Workload, armnn::DataType::QuantisedAsymm8>();
66 template <typename WorkloadType,
67 typename DescriptorType,
69 armnn::DataType DataType>
70 static void RefCreateArithmethicWorkloadTest()
73 RefWorkloadFactory factory;
74 auto workload = CreateArithmeticWorkloadTest<WorkloadType, DescriptorType, LayerType, DataType>(factory, graph);
76 CheckInputsOutput(std::move(workload),
77 TensorInfo({ 2, 3 }, DataType),
78 TensorInfo({ 2, 3 }, DataType),
79 TensorInfo({ 2, 3 }, DataType));
82 BOOST_AUTO_TEST_CASE(CreateAdditionFloatWorkload)
84 RefCreateArithmethicWorkloadTest<RefAdditionFloat32Workload,
85 AdditionQueueDescriptor,
87 armnn::DataType::Float32>();
90 BOOST_AUTO_TEST_CASE(CreateAdditionUint8Workload)
92 RefCreateArithmethicWorkloadTest<RefAdditionUint8Workload,
93 AdditionQueueDescriptor,
95 armnn::DataType::QuantisedAsymm8>();
98 BOOST_AUTO_TEST_CASE(CreateSubtractionFloatWorkload)
100 RefCreateArithmethicWorkloadTest<RefSubtractionFloat32Workload,
101 SubtractionQueueDescriptor,
103 armnn::DataType::Float32>();
106 BOOST_AUTO_TEST_CASE(CreateSubtractionUint8Workload)
108 RefCreateArithmethicWorkloadTest<RefSubtractionUint8Workload,
109 SubtractionQueueDescriptor,
111 armnn::DataType::QuantisedAsymm8>();
114 BOOST_AUTO_TEST_CASE(CreateMultiplicationFloatWorkload)
116 RefCreateArithmethicWorkloadTest<RefMultiplicationFloat32Workload,
117 MultiplicationQueueDescriptor,
119 armnn::DataType::Float32>();
122 BOOST_AUTO_TEST_CASE(CreateMultiplicationUint8Workload)
124 RefCreateArithmethicWorkloadTest<RefMultiplicationUint8Workload,
125 MultiplicationQueueDescriptor,
127 armnn::DataType::QuantisedAsymm8>();
130 BOOST_AUTO_TEST_CASE(CreateDivisionFloatWorkload)
132 RefCreateArithmethicWorkloadTest<RefDivisionFloat32Workload,
133 DivisionQueueDescriptor,
135 armnn::DataType::Float32>();
138 BOOST_AUTO_TEST_CASE(CreateDivisionUint8Workload)
140 RefCreateArithmethicWorkloadTest<RefDivisionUint8Workload,
141 DivisionQueueDescriptor,
143 armnn::DataType::QuantisedAsymm8>();
146 BOOST_AUTO_TEST_CASE(CreateBatchNormalizationWorkload)
149 RefWorkloadFactory factory;
150 auto workload = CreateBatchNormalizationWorkloadTest<RefBatchNormalizationFloat32Workload, armnn::DataType::Float32>
153 // Checks that outputs and inputs are as we expect them (see definition of CreateBatchNormalizationWorkloadTest).
155 std::move(workload), TensorInfo({2, 3, 1, 1}, DataType::Float32), TensorInfo({2, 3, 1, 1}, DataType::Float32));
158 BOOST_AUTO_TEST_CASE(CreateConvertFp16ToFp32Float32Workload)
161 RefWorkloadFactory factory;
162 auto workload = CreateConvertFp16ToFp32WorkloadTest<RefConvertFp16ToFp32Workload>(factory, graph);
164 // Checks that outputs and inputs are as we expect them
166 std::move(workload), TensorInfo({1, 3, 2, 3}, DataType::Float16), TensorInfo({1, 3, 2, 3}, DataType::Float32));
169 BOOST_AUTO_TEST_CASE(CreateConvertFp32ToFp16Float16Workload)
172 RefWorkloadFactory factory;
173 auto workload = CreateConvertFp32ToFp16WorkloadTest<RefConvertFp32ToFp16Workload>(factory, graph);
175 // Checks that outputs and inputs are as we expect them
177 std::move(workload), TensorInfo({1, 3, 2, 3}, DataType::Float32), TensorInfo({1, 3, 2, 3}, DataType::Float16));
180 static void RefCreateConvolution2dWorkloadTest(DataLayout dataLayout = DataLayout::NCHW)
183 RefWorkloadFactory factory;
184 auto workload = CreateConvolution2dWorkloadTest<RefConvolution2dFloat32Workload, DataType::Float32>
185 (factory, graph, dataLayout);
187 std::initializer_list<unsigned int> inputShape = (dataLayout == DataLayout::NCHW) ?
188 std::initializer_list<unsigned int>({2, 3, 8, 16}) : std::initializer_list<unsigned int>({2, 8, 16, 3});
189 std::initializer_list<unsigned int> outputShape = (dataLayout == DataLayout::NCHW) ?
190 std::initializer_list<unsigned int>({2, 2, 2, 10}) : std::initializer_list<unsigned int>({2, 2, 10, 2});
192 // Checks that outputs and inputs are as we expect them (see definition of CreateConvolution2dWorkloadTest).
193 CheckInputOutput(std::move(workload),
194 TensorInfo(inputShape, DataType::Float32),
195 TensorInfo(outputShape, DataType::Float32));
198 BOOST_AUTO_TEST_CASE(CreateConvolution2dFloatNchwWorkload)
200 RefCreateConvolution2dWorkloadTest(DataLayout::NCHW);
203 BOOST_AUTO_TEST_CASE(CreateConvolution2dFloatNhwcWorkload)
205 RefCreateConvolution2dWorkloadTest(DataLayout::NHWC);
208 template <typename FullyConnectedWorkloadType, armnn::DataType DataType>
209 static void RefCreateFullyConnectedWorkloadTest()
212 RefWorkloadFactory factory;
213 auto workload = CreateFullyConnectedWorkloadTest<FullyConnectedWorkloadType, DataType>(factory, graph);
215 // Checks that outputs and inputs are as we expect them (see definition of CreateFullyConnectedWorkloadTest).
216 float inputsQScale = DataType == armnn::DataType::QuantisedAsymm8 ? 1.0f : 0.0;
217 float outputQScale = DataType == armnn::DataType::QuantisedAsymm8 ? 2.0f : 0.0;
218 CheckInputOutput(std::move(workload),
219 TensorInfo({ 3, 1, 4, 5 }, DataType, inputsQScale),
220 TensorInfo({ 3, 7 }, DataType, outputQScale));
223 BOOST_AUTO_TEST_CASE(CreateFullyConnectedFloat32Workload)
225 RefCreateFullyConnectedWorkloadTest<RefFullyConnectedFloat32Workload, armnn::DataType::Float32>();
228 BOOST_AUTO_TEST_CASE(CreateFullyConnectedUint8Workload)
230 RefCreateFullyConnectedWorkloadTest<RefFullyConnectedUint8Workload, armnn::DataType::QuantisedAsymm8>();
233 template <typename NormalizationWorkloadType, armnn::DataType DataType>
234 static void RefCreateNormalizationWorkloadTest()
237 RefWorkloadFactory factory;
238 auto workload = CreateNormalizationWorkloadTest<NormalizationWorkloadType, DataType>(factory, graph);
240 // Checks that outputs and inputs are as we expect them (see definition of CreateNormalizationWorkloadTest).
241 CheckInputOutput(std::move(workload),
242 TensorInfo({3, 5, 5, 1}, DataType),
243 TensorInfo({3, 5, 5, 1}, DataType));
246 BOOST_AUTO_TEST_CASE(CreateRefNormalizationNchwWorkload)
248 RefCreateNormalizationWorkloadTest<RefNormalizationFloat32Workload, armnn::DataType::Float32>();
251 template <typename Pooling2dWorkloadType, armnn::DataType DataType>
252 static void RefCreatePooling2dWorkloadTest()
255 RefWorkloadFactory factory;
256 auto workload = CreatePooling2dWorkloadTest<Pooling2dWorkloadType, DataType>(factory, graph);
258 // Checks that outputs and inputs are as we expect them (see definition of CreatePooling2dWorkloadTest).
261 TensorInfo({3, 2, 5, 5}, DataType),
262 TensorInfo({3, 2, 2, 4}, DataType));
265 BOOST_AUTO_TEST_CASE(CreatePooling2dFloat32Workload)
267 RefCreatePooling2dWorkloadTest<RefPooling2dFloat32Workload, armnn::DataType::Float32>();
270 BOOST_AUTO_TEST_CASE(CreatePooling2dUint8Workload)
272 RefCreatePooling2dWorkloadTest<RefPooling2dUint8Workload, armnn::DataType::QuantisedAsymm8>();
275 template <typename SoftmaxWorkloadType, armnn::DataType DataType>
276 static void RefCreateSoftmaxWorkloadTest()
279 RefWorkloadFactory factory;
280 auto workload = CreateSoftmaxWorkloadTest<SoftmaxWorkloadType, DataType>(factory, graph);
282 // Checks that outputs and inputs are as we expect them (see definition of CreateSoftmaxWorkloadTest).
285 TensorInfo({4, 1}, DataType),
286 TensorInfo({4, 1}, DataType));
289 BOOST_AUTO_TEST_CASE(CreateSoftmaxFloat32Workload)
291 RefCreateSoftmaxWorkloadTest<RefSoftmaxFloat32Workload, armnn::DataType::Float32>();
294 BOOST_AUTO_TEST_CASE(CreateSoftmaxUint8Workload)
296 RefCreateSoftmaxWorkloadTest<RefSoftmaxUint8Workload, armnn::DataType::QuantisedAsymm8>();
299 template <typename SplitterWorkloadType, armnn::DataType DataType>
300 static void RefCreateSplitterWorkloadTest()
303 RefWorkloadFactory factory;
304 auto workload = CreateSplitterWorkloadTest<SplitterWorkloadType, DataType>(factory, graph);
306 // Checks that outputs are as we expect them (see definition of CreateSplitterWorkloadTest).
307 SplitterQueueDescriptor queueDescriptor = workload->GetData();
308 auto inputHandle = boost::polymorphic_downcast<ConstCpuTensorHandle*>(queueDescriptor.m_Inputs[0]);
309 BOOST_TEST((inputHandle->GetTensorInfo() == TensorInfo({ 5, 7, 7 }, DataType)));
311 auto outputHandle0 = boost::polymorphic_downcast<CpuTensorHandle*>(queueDescriptor.m_Outputs[0]);
312 BOOST_TEST((outputHandle0->GetTensorInfo() == TensorInfo({ 1, 7, 7 }, DataType)));
314 auto outputHandle1 = boost::polymorphic_downcast<CpuTensorHandle*>(queueDescriptor.m_Outputs[1]);
315 BOOST_TEST((outputHandle1->GetTensorInfo() == TensorInfo({ 2, 7, 7 }, DataType)));
317 auto outputHandle2 = boost::polymorphic_downcast<CpuTensorHandle*>(queueDescriptor.m_Outputs[2]);
318 BOOST_TEST((outputHandle2->GetTensorInfo() == TensorInfo({ 2, 7, 7 }, DataType)));
321 BOOST_AUTO_TEST_CASE(CreateSplitterFloat32Workload)
323 RefCreateSplitterWorkloadTest<RefSplitterFloat32Workload, armnn::DataType::Float32>();
326 BOOST_AUTO_TEST_CASE(CreateSplitterUint8Workload)
328 RefCreateSplitterWorkloadTest<RefSplitterUint8Workload, armnn::DataType::QuantisedAsymm8>();
331 template <typename SplitterWorkloadType, typename MergerWorkloadType, armnn::DataType DataType>
332 static void RefCreateSplitterMergerWorkloadTest()
334 // Tests that it is possible to decide which output of the splitter layer
335 // should be lined to which input of the merger layer.
336 // We tested that is is possible to specify 0th output
337 // of the splitter to be the 1st input to the merger and the 1st output of the splitter to be 0th input
341 RefWorkloadFactory factory;
342 auto workloads = CreateSplitterMergerWorkloadTest<SplitterWorkloadType, MergerWorkloadType, DataType>
345 auto wlSplitter = std::move(workloads.first);
346 auto wlMerger = std::move(workloads.second);
348 //Checks that the index of inputs/outputs matches what we declared on InputDescriptor construction.
349 armnn::CpuTensorHandle* sOut0 = dynamic_cast<armnn::CpuTensorHandle*>(wlSplitter->GetData().m_Outputs[0]);
350 armnn::CpuTensorHandle* sOut1 = dynamic_cast<armnn::CpuTensorHandle*>(wlSplitter->GetData().m_Outputs[1]);
351 armnn::CpuTensorHandle* mIn0 = dynamic_cast<armnn::CpuTensorHandle*>(wlMerger->GetData().m_Inputs[0]);
352 armnn::CpuTensorHandle* mIn1 = dynamic_cast<armnn::CpuTensorHandle*>(wlMerger->GetData().m_Inputs[1]);
359 bool validDataPointers = (sOut0 == mIn1) && (sOut1 == mIn0);
361 BOOST_TEST(validDataPointers);
364 BOOST_AUTO_TEST_CASE(CreateSplitterMergerFloat32)
366 RefCreateSplitterMergerWorkloadTest<RefSplitterFloat32Workload, RefMergerFloat32Workload, DataType::Float32>();
369 BOOST_AUTO_TEST_CASE(CreateSplitterMergerUint8)
371 RefCreateSplitterMergerWorkloadTest<RefSplitterUint8Workload, RefMergerUint8Workload, DataType::QuantisedAsymm8>();
374 template <typename SplitterWorkloadType, typename ActivationWorkloadType, armnn::DataType DataType>
375 static void RefCreateSingleOutputMultipleInputsTest()
377 // Tests that it is possible to assign multiple (two) different layers to each of the outputs of a splitter layer.
378 // We created a splitter with two outputs. That each of those outputs is used by two different activation layers.
381 RefWorkloadFactory factory;
382 std::unique_ptr<SplitterWorkloadType> wlSplitter;
383 std::unique_ptr<ActivationWorkloadType> wlActiv0_0;
384 std::unique_ptr<ActivationWorkloadType> wlActiv0_1;
385 std::unique_ptr<ActivationWorkloadType> wlActiv1_0;
386 std::unique_ptr<ActivationWorkloadType> wlActiv1_1;
388 CreateSplitterMultipleInputsOneOutputWorkloadTest<SplitterWorkloadType,
389 ActivationWorkloadType, DataType>(factory, graph, wlSplitter, wlActiv0_0, wlActiv0_1, wlActiv1_0, wlActiv1_1);
391 armnn::CpuTensorHandle* sOut0 = dynamic_cast<armnn::CpuTensorHandle*>(wlSplitter->GetData().m_Outputs[0]);
392 armnn::CpuTensorHandle* sOut1 = dynamic_cast<armnn::CpuTensorHandle*>(wlSplitter->GetData().m_Outputs[1]);
393 armnn::CpuTensorHandle* activ0_0Im = dynamic_cast<armnn::CpuTensorHandle*>(wlActiv0_0->GetData().m_Inputs[0]);
394 armnn::CpuTensorHandle* activ0_1Im = dynamic_cast<armnn::CpuTensorHandle*>(wlActiv0_1->GetData().m_Inputs[0]);
395 armnn::CpuTensorHandle* activ1_0Im = dynamic_cast<armnn::CpuTensorHandle*>(wlActiv1_0->GetData().m_Inputs[0]);
396 armnn::CpuTensorHandle* activ1_1Im = dynamic_cast<armnn::CpuTensorHandle*>(wlActiv1_1->GetData().m_Inputs[0]);
401 BOOST_TEST(activ0_0Im);
402 BOOST_TEST(activ0_1Im);
403 BOOST_TEST(activ1_0Im);
404 BOOST_TEST(activ1_1Im);
406 bool validDataPointers = (sOut0 == activ0_0Im) && (sOut0 == activ0_1Im) &&
407 (sOut1 == activ1_0Im) && (sOut1 == activ1_1Im);
409 BOOST_TEST(validDataPointers);
412 BOOST_AUTO_TEST_CASE(CreateSingleOutputMultipleInputsFloat32)
414 RefCreateSingleOutputMultipleInputsTest<RefSplitterFloat32Workload, RefActivationFloat32Workload,
415 armnn::DataType::Float32>();
418 BOOST_AUTO_TEST_CASE(CreateSingleOutputMultipleInputsUint8)
420 RefCreateSingleOutputMultipleInputsTest<RefSplitterUint8Workload, RefActivationUint8Workload,
421 armnn::DataType::QuantisedAsymm8>();
424 template <typename ResizeBilinearWorkloadType, armnn::DataType DataType>
425 static void RefCreateResizeBilinearTest(DataLayout dataLayout)
428 RefWorkloadFactory factory;
429 auto workload = CreateResizeBilinearWorkloadTest<ResizeBilinearWorkloadType, DataType>(factory, graph, dataLayout);
431 TensorShape inputShape;
432 TensorShape outputShape;
436 case DataLayout::NHWC:
437 inputShape = { 2, 4, 4, 3 };
438 outputShape = { 2, 2, 2, 3 };
441 inputShape = { 2, 3, 4, 4 };
442 outputShape = { 2, 3, 2, 2 };
445 // Checks that outputs and inputs are as we expect them (see definition of CreateResizeBilinearWorkloadTest).
448 TensorInfo(inputShape, DataType),
449 TensorInfo(outputShape, DataType));
452 BOOST_AUTO_TEST_CASE(CreateResizeBilinearFloat32)
454 RefCreateResizeBilinearTest<RefResizeBilinearFloat32Workload, armnn::DataType::Float32>(DataLayout::NCHW);
457 BOOST_AUTO_TEST_CASE(CreateResizeBilinearUint8)
459 RefCreateResizeBilinearTest<RefResizeBilinearUint8Workload, armnn::DataType::QuantisedAsymm8>(DataLayout::NCHW);
462 BOOST_AUTO_TEST_CASE(CreateResizeBilinearFloat32Nhwc)
464 RefCreateResizeBilinearTest<RefResizeBilinearFloat32Workload, armnn::DataType::Float32>(DataLayout::NHWC);
467 template <typename L2NormalizationWorkloadType, armnn::DataType DataType>
468 static void RefCreateL2NormalizationTest(DataLayout dataLayout)
471 RefWorkloadFactory factory;
473 CreateL2NormalizationWorkloadTest<L2NormalizationWorkloadType, DataType>(factory, graph, dataLayout);
475 TensorShape inputShape;
476 TensorShape outputShape;
480 case DataLayout::NHWC:
481 inputShape = { 5, 50, 67, 20 };
482 outputShape = { 5, 50, 67, 20 };
484 case DataLayout::NCHW:
486 inputShape = { 5, 20, 50, 67 };
487 outputShape = { 5, 20, 50, 67 };
491 // Checks that outputs and inputs are as we expect them (see definition of CreateL2NormalizationWorkloadTest).
492 CheckInputOutput(std::move(workload), TensorInfo(inputShape, DataType), TensorInfo(outputShape, DataType));
495 BOOST_AUTO_TEST_CASE(CreateL2NormalizationFloat32)
497 RefCreateL2NormalizationTest<RefL2NormalizationFloat32Workload, armnn::DataType::Float32>(DataLayout::NCHW);
500 BOOST_AUTO_TEST_CASE(CreateL2NormalizationFloat32Nhwc)
502 RefCreateL2NormalizationTest<RefL2NormalizationFloat32Workload, armnn::DataType::Float32>(DataLayout::NHWC);
505 template <typename ReshapeWorkloadType, armnn::DataType DataType>
506 static void RefCreateReshapeWorkloadTest()
509 RefWorkloadFactory factory;
510 auto workload = CreateReshapeWorkloadTest<ReshapeWorkloadType, DataType>(factory, graph);
512 // Checks that outputs and inputs are as we expect them (see definition of CreateReshapeWorkloadTest).
515 TensorInfo({ 4, 1 }, DataType),
516 TensorInfo({ 1, 4 }, DataType));
519 BOOST_AUTO_TEST_CASE(CreateReshapeFloat32Workload)
521 RefCreateReshapeWorkloadTest<RefReshapeFloat32Workload, armnn::DataType::Float32>();
524 BOOST_AUTO_TEST_CASE(CreateReshapeUint8Workload)
526 RefCreateReshapeWorkloadTest<RefReshapeUint8Workload, armnn::DataType::QuantisedAsymm8>();
529 BOOST_AUTO_TEST_SUITE_END()