#include "mkldnn_test_common.hpp"
#include "gtest/gtest.h"
-
#include "mkldnn.hpp"
+#include "test_convolution_depthwise_forward_common.hpp"
namespace mkldnn {
-template <typename T> inline T scale_shift_fwd(T s_val, T w_val, T b_val) {
- return s_val*w_val + b_val;
-}
-
-template <typename T> inline T prelu_fwd(T s_val, T w_val) {
- return s_val >= 0 ? s_val : w_val*s_val;
-}
-
-template <typename data_t_src, typename data_t_wei,
- typename data_t_acc, typename data_t_dst>
-void compute_ref_conv_depthwise_fwd(const test_convolution_sizes_t &c,
- const memory &src, const memory &weights, const memory &bias,
- const memory &dst, bool w_bias, algorithm depthwise_alg,
- const memory &depthwise_weights, const memory &depthwise_bias)
-{
- data_t_src *src_data = (data_t_src *)src.get_data_handle();
- data_t_wei *weights_data = (data_t_wei *)weights.get_data_handle();
- data_t_dst *bias_data
- = (data_t_dst *)(w_bias ? bias.get_data_handle() : nullptr);
- data_t_dst *dst_data = (data_t_dst *)dst.get_data_handle();
-
- data_t_dst *d_weights_data = (data_t_dst *)depthwise_weights.get_data_handle();
- data_t_dst *d_bias_data = (data_t_dst *)depthwise_bias.get_data_handle();
-
- const memory::desc src_d = src.get_primitive_desc().desc();
- const memory::desc weights_d = weights.get_primitive_desc().desc();
- const memory::desc dst_d = dst.get_primitive_desc().desc();
-
-#pragma omp parallel for collapse(5) schedule(static)
- for (int n = 0; n < c.mb; n++) {
- for (int g = 0; g < c.ng; g++) {
- for (int oc = 0; oc < c.oc / c.ng; oc++) {
- for (int oh = 0; oh < c.oh; oh++) {
- for (int ow = 0; ow < c.ow; ow++) {
- int oidx = n * c.oc * c.oh * c.ow
- + g * c.oc / c.ng * c.oh * c.ow
- + oc * c.oh * c.ow + oh * c.ow + ow;
-
- int didx = map_index(dst_d, oidx);
- int bidx = g * c.oc / c.ng + oc;
- dst_data[didx] = bias_data ?
- bias_data[map_index(
- bias.get_primitive_desc().desc(),
- bidx)] :
- data_t_dst{0};
- for (int ic = 0; ic < c.ic / c.ng; ic++) {
- for (int kh = 0; kh < c.kh; kh++) {
- for (int kw = 0; kw < c.kw; kw++) {
- int iw = ow * c.strw
- - c.padw + kw * (1 + c.dilw);
- int ih = oh * c.strh
- - c.padh + kh * (1 + c.dilh);
- if (iw < 0 || iw >= c.iw) continue;
- if (ih < 0 || ih >= c.ih) continue;
- int iidx = n * c.ic * c.ih * c.iw
- + g * c.ic / c.ng * c.ih * c.iw
- + ic * c.ih * c.iw + ih * c.iw + iw;
- int widx = g * c.oc / c.ng * c.ic
- / c.ng * c.kh * c.kw
- + oc * c.ic / c.ng * c.kh * c.kw
- + ic * c.kh * c.kw + kh * c.kw + kw;
-
- dst_data[didx]
- += src_data[map_index(src_d, iidx)]
- * weights_data[map_index(
- weights_d, widx)];
- }
- }
- }
-
- switch (depthwise_alg) {
- case depthwise_scale_shift:
- dst_data[didx] = scale_shift_fwd(dst_data[didx], d_weights_data[bidx], d_bias_data[bidx]);
- break;
- case depthwise_prelu:
- dst_data[didx] = prelu_fwd(dst_data[didx], d_weights_data[bidx]);
- break;
- default: assert(!"unknown alg_kind");
- }
- }
- }
- }
- }
- }
-}
-
-template <typename data_t_src, typename data_t_wei,
- typename data_t_acc, typename data_t_dst>
-class convolution_depthwise_test
- : public ::testing::TestWithParam<test_convolution_depthwise_params_t> {
-protected:
- virtual void SetUp()
- {
- test_convolution_depthwise_params_t p
- = ::testing::TestWithParam<
- test_convolution_depthwise_params_t>::GetParam();
-
- ASSERT_TRUE(p.engine_kind == engine::kind::cpu);
- ASSERT_EQ(p.aalgorithm, convolution_direct);
- auto eng = engine(p.engine_kind, 0);
-
- memory::data_type data_type_src = data_traits<data_t_src>::data_type;
- memory::data_type data_type_dst = data_traits<data_t_dst>::data_type;
- memory::data_type data_type_wei = data_traits<data_t_wei>::data_type;
-
- test_convolution_sizes_t cd = p.sizes;
-
- auto c_src_desc = create_md({ cd.mb, cd.ic, cd.ih, cd.iw },
- data_type_src, p.formats.src_format);
- auto c_weights_desc = cd.ng > 1 ?
- create_md({ cd.ng, cd.oc / cd.ng, cd.ic / cd.ng, cd.kh, cd.kw },
- data_type_wei, p.formats.weights_format) :
- create_md({ cd.oc, cd.ic, cd.kh, cd.kw },
- data_type_wei, p.formats.weights_format);
- auto c_dst_desc = create_md({ cd.mb, cd.oc, cd.oh, cd.ow },
- data_type_dst, p.formats.dst_format);
-
- auto c_src = memory({c_src_desc, eng});
- auto c_weights = memory({c_weights_desc, eng});
- auto c_dst = memory({c_dst_desc, eng});
-
- auto dst_ref = memory({c_dst_desc, eng});
-
- fill_data<data_t_src>(c_src.get_primitive_desc().get_size()
- / sizeof(data_t_src), (data_t_src *)c_src.get_data_handle(), data_t_src(0), data_t_src(1));
-
- fill_data<data_t_wei>(
- c_weights.get_primitive_desc().get_size()
- / sizeof(data_t_wei),(data_t_wei *)c_weights.get_data_handle(), data_t_wei(0), data_t_wei(1));
-
- bool with_bias = p.formats.bias_format != memory::format::format_undef;
- auto c_bias_desc = with_bias ?
- create_md({ cd.oc }, data_type_dst, p.formats.bias_format) :
- create_md({}, data_type_dst, p.formats.bias_format);
- auto c_bias = memory({c_bias_desc, eng});
- if (with_bias) {
- fill_data<data_t_dst>(
- c_bias.get_primitive_desc().get_size() / sizeof(data_t_dst),
- (data_t_dst *)c_bias.get_data_handle(), 1., true);
- }
-
- std::vector<int> padR = { cd.padh, cd.padw };
- for (int i = 0; i < 2; ++i) {
- if ((cd.ih - ((cd.kh - 1) * (cd.dilh + 1) + 1) + cd.padh + padR[0])
- / cd.strh + 1 != cd.oh)
- ++padR[0];
- if ((cd.iw - ((cd.kw - 1) * (cd.dilw + 1) + 1) + cd.padw + padR[1])
- / cd.strw + 1 != cd.ow)
- ++padR[1];
- }
-
- auto c_depthwise_weights_desc = create_md({ cd.oc }, data_type_dst, memory::x);
- auto c_depthwise_bias_desc = create_md({ cd.oc }, data_type_dst, memory::x);
-
- auto c_depthwise_weights = memory({c_depthwise_weights_desc, eng});
- auto c_depthwise_bias = memory({c_depthwise_bias_desc, eng});
-
- fill_data<data_t_dst>(
- c_depthwise_weights.get_primitive_desc().get_size() / sizeof(data_t_dst),
- (data_t_dst *)c_depthwise_weights.get_data_handle(), 1., true);
- fill_data<data_t_dst>(
- c_depthwise_bias.get_primitive_desc().get_size() / sizeof(data_t_dst),
- (data_t_dst *)c_depthwise_bias.get_data_handle(), 1., true);
-
- auto test = [&]() {
- mkldnn::post_ops ops;
- ops.append_depthwise(p.alg, static_cast<const float*>(c_depthwise_weights.get_data_handle()),
- static_cast<const float*>(c_depthwise_bias.get_data_handle()));
-
- mkldnn::primitive_attr attr;
- attr.set_post_ops(ops);
-
- auto conv_desc = with_bias
- ? convolution_forward::desc(prop_kind::forward_scoring,
- p.aalgorithm, c_src_desc, c_weights_desc, c_bias_desc,
- c_dst_desc, { cd.strh, cd.strw }, { cd.dilh, cd.dilw },
- { cd.padh, cd.padw }, padR, padding_kind::zero)
- : convolution_forward::desc(prop_kind::forward_scoring,
- p.aalgorithm, c_src_desc, c_weights_desc, c_dst_desc,
- { cd.strh, cd.strw }, { cd.dilh, cd.dilw },
- { cd.padh, cd.padw }, padR, padding_kind::zero);
-
- auto conv_primitive_desc =
- convolution_forward::primitive_desc(conv_desc, attr, eng);
-
- auto conv = with_bias
- ? convolution_forward(conv_primitive_desc,
- c_src, c_weights, c_bias, c_dst)
- : convolution_forward(conv_primitive_desc,
- c_src, c_weights, c_dst);
- std::vector<primitive> pipeline;
- pipeline.push_back(conv);
-
- stream(stream::kind::lazy).submit(pipeline).wait();
- };
-
- if (catch_expected_failures(test, p.expect_to_fail, p.expected_status))
- return;
-
- compute_ref_conv_depthwise_fwd<data_t_src, data_t_wei, data_t_wei,
- data_t_dst>(cd, c_src, c_weights, c_bias, dst_ref, with_bias,
- p.alg, c_depthwise_weights, c_depthwise_bias);
- compare_data<data_t_dst>(dst_ref, c_dst, 1e-3);
- }
-};
-
using convolution_test = convolution_depthwise_test<float, float, float, float>;
TEST_P(convolution_test, TestConvolution)
{ mkldnn::memory::format::src, mkldnn::memory::format::weights, \
mkldnn::memory::format::bias, mkldnn::memory::format::dst }
-#define FMT_WEIGHTS_BLOCKED OIhw8i8o
+#define FMT_WEIGHTS_BLOCKED8 OIhw8i8o
+#define FMT_WEIGHTS_BLOCKED8_DW Goihw8g
#define FMT_WEIGHTS_BLOCKED16 OIhw16i16o
+#define FMT_WEIGHTS_BLOCKED16_DW Goihw16g
#define ENGINE mkldnn::engine::kind::cpu
#define ALGORITHM mkldnn::convolution_direct
EXPAND_ARGS(PARAMS_CONV(depthwise_scale_shift, __VA_ARGS__)), \
EXPAND_ARGS(PARAMS_CONV(depthwise_prelu, __VA_ARGS__))
-
#define PARAMS_CONV(alg, src, weights, bias, dst, ...) \
test_convolution_depthwise_params_t {alg, ENGINE, ALGORITHM, \
EXPAND_FORMATS(src, weights, bias, dst), /* empty attributes */ {}, \
2, 32, 32, 9, 9, 32, 9, 9, 1, 1, 0, 0, 1, 1)
);
- INST_TEST_CASE(SimpleSmall_Blocked,
- PARAMS(nChw8c, OIhw8i8o, x, nChw8c,
+ INST_TEST_CASE(SimpleSmall_Blocked8,
+ PARAMS(nChw8c, FMT_WEIGHTS_BLOCKED8, x, nChw8c,
2, 1, 32, 13, 13, 48, 11, 11, 3, 3, 0, 0, 1, 1),
- PARAMS(nChw8c, OIhw8i8o, x, nChw8c,
+ PARAMS(nChw8c, FMT_WEIGHTS_BLOCKED8, x, nChw8c,
2, 1, 16, 13, 13, 48, 13, 13, 1, 1, 0, 0, 1, 1),
- PARAMS(nChw8c, Goihw8g, x, nChw8c,
+ PARAMS(nChw8c, FMT_WEIGHTS_BLOCKED8_DW, x, nChw8c,
2, 64, 64, 16, 16, 64, 16, 16, 3, 3, 0, 0, 1, 1),
- PARAMS(nChw8c, Goihw8g, x, nChw8c,
+ PARAMS(nChw8c, FMT_WEIGHTS_BLOCKED8_DW, x, nChw8c,
2, 32, 32, 9, 9, 32, 9, 9, 1, 1, 0, 0, 1, 1)
);
INST_TEST_CASE(SimpleSmall_Blocked16,
- PARAMS(nChw16c, OIhw16i16o, x, nChw16c,
+ PARAMS(nChw16c, FMT_WEIGHTS_BLOCKED16, x, nChw16c,
2, 1, 32, 13, 13, 48, 11, 11, 3, 3, 0, 0, 1, 1),
- PARAMS(nChw16c, OIhw16i16o, x, nChw16c,
+ PARAMS(nChw16c, FMT_WEIGHTS_BLOCKED16, x, nChw16c,
2, 1, 16, 13, 13, 48, 13, 13, 1, 1, 0, 0, 1, 1),
- PARAMS(nChw16c, Goihw16g, x, nChw16c,
+ PARAMS(nChw16c, FMT_WEIGHTS_BLOCKED16_DW, x, nChw16c,
2, 64, 64, 16, 16, 64, 16, 16, 3, 3, 0, 0, 1, 1),
- PARAMS(nChw16c, Goihw16g, x, nChw16c,
+ PARAMS(nChw16c, FMT_WEIGHTS_BLOCKED16_DW, x, nChw16c,
2, 32, 32, 9, 9, 32, 9, 9, 1, 1, 0, 0, 1, 1)
);
}