arm_compute v18.05
[platform/upstream/armcl.git] / examples / graph_vgg19.cpp
1 /*
2  * Copyright (c) 2017-2018 ARM Limited.
3  *
4  * SPDX-License-Identifier: MIT
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to
8  * deal in the Software without restriction, including without limitation the
9  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10  * sell copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in all
14  * copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  */
24 #include "arm_compute/graph.h"
25 #include "support/ToolchainSupport.h"
26 #include "utils/GraphUtils.h"
27 #include "utils/Utils.h"
28
29 #include <cstdlib>
30
31 using namespace arm_compute::utils;
32 using namespace arm_compute::graph::frontend;
33 using namespace arm_compute::graph_utils;
34
35 /** Example demonstrating how to implement VGG19's network using the Compute Library's graph API
36  *
37  * @param[in] argc Number of arguments
38  * @param[in] argv Arguments ( [optional] Target (0 = NEON, 1 = OpenCL, 2 = OpenCL with Tuner), [optional] Path to the weights folder, [optional] image, [optional] labels, [optional] Fast math for convolution layer (0 = DISABLED, 1 = ENABLED) )
39  */
40 class GraphVGG19Example : public Example
41 {
42 public:
43     void do_setup(int argc, char **argv) override
44     {
45         std::string data_path; /* Path to the trainable data */
46         std::string image;     /* Image data */
47         std::string label;     /* Label data */
48
49         // Create a preprocessor object
50         const std::array<float, 3> mean_rgb{ { 123.68f, 116.779f, 103.939f } };
51         std::unique_ptr<IPreprocessor> preprocessor = arm_compute::support::cpp14::make_unique<CaffePreproccessor>(mean_rgb);
52
53         // Set target. 0 (NEON), 1 (OpenCL), 2 (OpenCL with Tuner). By default it is NEON
54         const int    target         = argc > 1 ? std::strtol(argv[1], nullptr, 10) : 0;
55         Target       target_hint    = set_target_hint(target);
56         FastMathHint fast_math_hint = FastMathHint::DISABLED;
57         const bool   is_opencl      = target_hint == Target::CL;
58
59         ConvolutionMethod first_convolution3x3_hint = is_opencl ? ConvolutionMethod::DIRECT : ConvolutionMethod::GEMM;
60         ConvolutionMethod convolution3x3_hint       = ConvolutionMethod::DEFAULT;
61
62         // Parse arguments
63         if(argc < 2)
64         {
65             // Print help
66             std::cout << "Usage: " << argv[0] << " [target] [path_to_data] [image] [labels] [fast_math_hint]\n\n";
67             std::cout << "No data folder provided: using random values\n\n";
68         }
69         else if(argc == 2)
70         {
71             std::cout << "Usage: " << argv[0] << " " << argv[1] << " [path_to_data] [image] [labels] [fast_math_hint]\n\n";
72             std::cout << "No data folder provided: using random values\n\n";
73         }
74         else if(argc == 3)
75         {
76             data_path = argv[2];
77             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " [image] [labels] [fast_math_hint]\n\n";
78             std::cout << "No image provided: using random values\n\n";
79         }
80         else if(argc == 4)
81         {
82             data_path = argv[2];
83             image     = argv[3];
84             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " " << argv[3] << " [labels] [fast_math_hint]\n\n";
85             std::cout << "No text file with labels provided: skipping output accessor\n\n";
86         }
87         else if(argc == 5)
88         {
89             data_path = argv[2];
90             image     = argv[3];
91             label     = argv[4];
92             std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " " << argv[3] << " " << argv[4] << " [fast_math_hint]\n\n";
93             std::cout << "No fast math info provided: disabling fast math\n\n";
94         }
95         else
96         {
97             data_path      = argv[2];
98             image          = argv[3];
99             label          = argv[4];
100             fast_math_hint = (std::strtol(argv[5], nullptr, 1) == 0) ? FastMathHint::DISABLED : FastMathHint::ENABLED;
101         }
102
103         graph << target_hint
104               << first_convolution3x3_hint
105               << fast_math_hint
106               << InputLayer(TensorDescriptor(TensorShape(224U, 224U, 3U, 1U), DataType::F32),
107                             get_input_accessor(image, std::move(preprocessor)))
108               // Layer 1
109               << ConvolutionLayer(
110                   3U, 3U, 64U,
111                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv1_1_w.npy"),
112                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv1_1_b.npy"),
113                   PadStrideInfo(1, 1, 1, 1))
114               .set_name("conv1_1")
115               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv1_1/Relu")
116               << convolution3x3_hint
117               << ConvolutionLayer(
118                   3U, 3U, 64U,
119                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv1_2_w.npy"),
120                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv1_2_b.npy"),
121                   PadStrideInfo(1, 1, 1, 1))
122               .set_name("conv1_2")
123               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv1_2/Relu")
124               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 2, PadStrideInfo(2, 2, 0, 0))).set_name("pool1")
125               // Layer 2
126               << ConvolutionLayer(
127                   3U, 3U, 128U,
128                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv2_1_w.npy"),
129                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv2_1_b.npy"),
130                   PadStrideInfo(1, 1, 1, 1))
131               .set_name("conv2_1")
132               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv2_1/Relu")
133               << ConvolutionLayer(
134                   3U, 3U, 128U,
135                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv2_2_w.npy"),
136                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv2_2_b.npy"),
137                   PadStrideInfo(1, 1, 1, 1))
138               .set_name("conv2_2")
139               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv2_2/Relu")
140               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 2, PadStrideInfo(2, 2, 0, 0))).set_name("pool2")
141               // Layer 3
142               << ConvolutionLayer(
143                   3U, 3U, 256U,
144                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_1_w.npy"),
145                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_1_b.npy"),
146                   PadStrideInfo(1, 1, 1, 1))
147               .set_name("conv3_1")
148               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv3_1/Relu")
149               << ConvolutionLayer(
150                   3U, 3U, 256U,
151                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_2_w.npy"),
152                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_2_b.npy"),
153                   PadStrideInfo(1, 1, 1, 1))
154               .set_name("conv3_2")
155               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv3_2/Relu")
156               << ConvolutionLayer(
157                   3U, 3U, 256U,
158                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_3_w.npy"),
159                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_3_b.npy"),
160                   PadStrideInfo(1, 1, 1, 1))
161               .set_name("conv3_3")
162               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv3_3/Relu")
163               << ConvolutionLayer(
164                   3U, 3U, 256U,
165                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_4_w.npy"),
166                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv3_4_b.npy"),
167                   PadStrideInfo(1, 1, 1, 1))
168               .set_name("conv3_4")
169               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv3_4/Relu")
170               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 2, PadStrideInfo(2, 2, 0, 0))).set_name("pool3")
171               // Layer 4
172               << ConvolutionLayer(
173                   3U, 3U, 512U,
174                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_1_w.npy"),
175                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_1_b.npy"),
176                   PadStrideInfo(1, 1, 1, 1))
177               .set_name("conv4_1")
178               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv4_1/Relu")
179               << ConvolutionLayer(
180                   3U, 3U, 512U,
181                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_2_w.npy"),
182                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_2_b.npy"),
183                   PadStrideInfo(1, 1, 1, 1))
184               .set_name("conv4_2")
185               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv4_2/Relu")
186               << ConvolutionLayer(
187                   3U, 3U, 512U,
188                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_3_w.npy"),
189                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_3_b.npy"),
190                   PadStrideInfo(1, 1, 1, 1))
191               .set_name("conv4_3")
192               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv4_3/Relu")
193               << ConvolutionLayer(
194                   3U, 3U, 512U,
195                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_4_w.npy"),
196                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv4_4_b.npy"),
197                   PadStrideInfo(1, 1, 1, 1))
198               .set_name("conv4_4")
199               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv4_4/Relu")
200               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 2, PadStrideInfo(2, 2, 0, 0))).set_name("pool4")
201               // Layer 5
202               << ConvolutionLayer(
203                   3U, 3U, 512U,
204                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_1_w.npy"),
205                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_1_b.npy"),
206                   PadStrideInfo(1, 1, 1, 1))
207               .set_name("conv5_1")
208               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv5_1/Relu")
209               << ConvolutionLayer(
210                   3U, 3U, 512U,
211                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_2_w.npy"),
212                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_2_b.npy"),
213                   PadStrideInfo(1, 1, 1, 1))
214               .set_name("conv5_2")
215               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv5_2/Relu")
216               << ConvolutionLayer(
217                   3U, 3U, 512U,
218                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_3_w.npy"),
219                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_3_b.npy"),
220                   PadStrideInfo(1, 1, 1, 1))
221               .set_name("conv5_3")
222               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv5_3/Relu")
223               << ConvolutionLayer(
224                   3U, 3U, 512U,
225                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_4_w.npy"),
226                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/conv5_4_b.npy"),
227                   PadStrideInfo(1, 1, 1, 1))
228               .set_name("conv5_4")
229               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("conv5_4/Relu")
230               << PoolingLayer(PoolingLayerInfo(PoolingType::MAX, 2, PadStrideInfo(2, 2, 0, 0))).set_name("pool5")
231               // Layer 6
232               << FullyConnectedLayer(
233                   4096U,
234                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc6_w.npy"),
235                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc6_b.npy"))
236               .set_name("fc6")
237               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("Relu")
238               // Layer 7
239               << FullyConnectedLayer(
240                   4096U,
241                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc7_w.npy"),
242                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc7_b.npy"))
243               .set_name("fc7")
244               << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::RELU)).set_name("Relu_1")
245               // Layer 8
246               << FullyConnectedLayer(
247                   1000U,
248                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc8_w.npy"),
249                   get_weights_accessor(data_path, "/cnn_data/vgg19_model/fc8_b.npy"))
250               .set_name("fc8")
251               // Softmax
252               << SoftmaxLayer().set_name("prob")
253               << OutputLayer(get_output_accessor(label, 5));
254
255         // Finalize graph
256         GraphConfig config;
257         config.use_tuner = (target == 2);
258         graph.finalize(target_hint, config);
259     }
260     void do_run() override
261     {
262         // Run graph
263         graph.run();
264     }
265
266 private:
267     Stream graph{ 0, "VGG19" };
268 };
269
270 /** Main program for VGG19
271  *
272  * @param[in] argc Number of arguments
273  * @param[in] argv Arguments ( [optional] Target (0 = NEON, 1 = OpenCL, 2 = OpenCL with Tuner), [optional] Path to the weights folder, [optional] image, [optional] labels, [optional] Fast math for convolution layer (0 = DISABLED, 1 = ENABLED) )
274  */
275 int main(int argc, char **argv)
276 {
277     return arm_compute::utils::run_example<GraphVGG19Example>(argc, argv);
278 }