1 /*
2 * Copyright (c) 2019-2020 Arm Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24 #include "src/core/NEON/kernels/NEDepthwiseConvolutionLayerNativeKernel.h"
25 #include "tests/NEON/Accessor.h"
26 #include "tests/NEON/Helper.h"
27 #include "tests/framework/Macros.h"
28 #include "tests/framework/datasets/Datasets.h"
29 #include "tests/validation/Validation.h"
30 #include "tests/validation/fixtures/DepthwiseConvolutionLayerFixture.h"
31
32 namespace arm_compute
33 {
34 namespace test
35 {
36 namespace validation
37 {
38 using namespace arm_compute::misc::shape_calculator;
39
40 // Create function for NEDepthwiseConvolutionLayerKernel
41 using NEDepthwiseConvolutionLayerNative = NESynthetizeFunctionWithZeroConstantKernelBorder<NEDepthwiseConvolutionLayerNativeKernel>;
42
43 // Fixture for NEDepthwiseConvolutionLayerKernel
44 template <typename T>
45 using NEDepthwiseConvolutionLayerNativeFixture = DepthwiseConvolutionLayerNativeValidationFixture<Tensor, Accessor, NEDepthwiseConvolutionLayerNative, T>;
46
47 namespace
48 {
49 // *INDENT-OFF*
50 // clang-format off
51 RelativeTolerance<float> rel_tolerance_f32(0.001f);
52 constexpr float abs_tolerance_f32(0.0001f);
53
54 /** Width values to test - Precommit */
55 const auto width_values_precommit = framework::dataset::make("width", { 17U } );
56
57 /** Width values to test - Nightly */
58 const auto width_values_nightly = framework::dataset::make("width", { 53U, 47U } );
59
60 /** Height values to test - Precommit */
61 const auto height_values_precommit = framework::dataset::make("height", { 19U } );
62
63 /** Height values to test - Nightly */
64 const auto height_values_nightly = framework::dataset::make("height", { 39U, 43U } );
65
66 /** Channel values to test - Precommit */
67 const auto channel_values_precommit = framework::dataset::make("channels", { 15U });
68
69 /** Channel values to test - Nightly */
70 const auto channel_values_nightly = framework::dataset::make("channels", { 33U, 19U });
71
72 /** Batch values to test - Precommit */
73 const auto batch_values_precommit = framework::dataset::make("batch", { 1U, 2U });
74
75 /** Batch values to test - Nightly */
76 const auto batch_values_nightly = framework::dataset::make("batch", { 1U, 3U });
77
78 /** Kernel size values to test - Precommit */
79 const auto kernel_sz_values_precommit = framework::dataset::make("kernel_size", { Size2D(1U, 1U), Size2D(1U, 3U) });
80
81 /** Kernel size values to test - Nightly */
82 const auto kernel_sz_values_nightly = framework::dataset::make("kernel_size", { Size2D(3U, 5U), Size2D(5U, 1U), Size2D(1U, 7U), Size2D(9U, 7U) });
83
84 /** Depth multiplier values to test - All */
85 const auto depth_multiplier_values = framework::dataset::make("depth_multiplier", { 1U, 3U });
86
87 /** Dilation values to test - All */
88 const auto dilation_values = framework::dataset::make("dilation", { Size2D(1U, 1U), Size2D(3U, 3U) });
89
90 /** Stride values to test - All */
91 const auto stride_values = framework::dataset::make("stride", { Size2D(1U, 1U), Size2D(3U, 2U) });
92
93 /** Padding values to test - All */
94 const auto padding_valid_values = framework::dataset::make("padding_valid", { true, false });
95
96 /** Data type values to test - All */
97 const auto data_type_values = framework::dataset::make("data_type", { DataType::F32 });
98
99 /** Data layout values to test - All */
100 const auto data_layout_values = framework::dataset::make("data_layout", { DataLayout::NHWC });
101 } // namespace
102
103 TEST_SUITE(NEON)
TEST_SUITE(DepthwiseConvolutionLayerNative)104 TEST_SUITE(DepthwiseConvolutionLayerNative)
105
106 TEST_CASE(ValidateNoPadding, framework::DatasetMode::ALL)
107 {
108 // this test case will ensure that the kernel is not adding implicit padding
109 constexpr uint32_t vector_size = 8; // Asummed vector size of the current native kernel
110 constexpr auto depth = vector_size * 2 + 1; // mis-aligned depth to force padding if exists.
111 constexpr auto data_layout = DataLayout::NHWC;
112 constexpr auto data_type = DataType::F32;
113
114 const auto input_size = Size2D{ 100, 100 }; // random plane size of the input
115 const auto kernel_size = Size2D{ 4, 4 }; // random plane size of the kernel
116 const auto pad_stride_info = PadStrideInfo(3, 3); // random convolution information to
117
118 TensorShape src_shape{ depth, input_size.x(), input_size.y() };
119 TensorShape weights_shape{ depth, kernel_size.x(), kernel_size.y() };
120 TensorShape bias_shape{ depth };
121
122 auto src = create_tensor<Tensor>(src_shape, data_type, 1, QuantizationInfo(), data_layout);
123 auto weights = create_tensor<Tensor>(weights_shape, data_type, 1, QuantizationInfo(), data_layout);
124 auto biases = create_tensor<Tensor>(bias_shape, data_type, 1, QuantizationInfo(), data_layout);
125 auto dst = create_tensor<Tensor>(TensorShape(), data_type, 1, QuantizationInfo(), data_layout);
126
127 NEDepthwiseConvolutionLayerNativeKernel dwc;
128 dwc.configure(&src, &weights, &biases, &dst, pad_stride_info);
129
130 ARM_COMPUTE_EXPECT(src.info()->padding().empty(), framework::LogLevel::ERRORS);
131 ARM_COMPUTE_EXPECT(weights.info()->padding().empty(), framework::LogLevel::ERRORS);
132 ARM_COMPUTE_EXPECT(biases.info()->padding().empty(), framework::LogLevel::ERRORS);
133 ARM_COMPUTE_EXPECT(dst.info()->padding().empty(), framework::LogLevel::ERRORS);
134 }
135
136 TEST_SUITE(Float)
TEST_SUITE(FP32)137 TEST_SUITE(FP32)
138 FIXTURE_DATA_TEST_CASE(RunSmall, NEDepthwiseConvolutionLayerNativeFixture<float>, framework::DatasetMode::ALL,
139 combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_precommit,
140 height_values_precommit),
141 channel_values_precommit),
142 batch_values_precommit),
143 kernel_sz_values_precommit),
144 depth_multiplier_values),
145 dilation_values),
146 stride_values),
147 padding_valid_values),
148 data_type_values),
149 data_layout_values))
150 {
151 // Validate output
152 validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
153 }
154
/** F32 run over the combination of the nightly datasets with the shared
 *  depth-multiplier, dilation, stride, padding, data-type and data-layout datasets.
 *  Registered for DatasetMode::NIGHTLY.
 */
FIXTURE_DATA_TEST_CASE(RunLarge, NEDepthwiseConvolutionLayerNativeFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(width_values_nightly,
                                                                                                       height_values_nightly),
                                                                                               channel_values_nightly),
                                                                                       batch_values_nightly),
                                                                               kernel_sz_values_nightly),
                                                                       depth_multiplier_values),
                                                               dilation_values),
                                                       stride_values),
                                               padding_valid_values),
                                       data_type_values),
                               data_layout_values))
{
    // Validate output against the reference using the F32 relative and absolute tolerances
    validate(Accessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}
171
172 TEST_SUITE_END() // FP32
173 TEST_SUITE_END() // Float
174 TEST_SUITE_END() // DepthwiseConvolutionLayerNative
175 TEST_SUITE_END() // NEON
176 } // namespace validation
177 } // namespace test
178 } // namespace arm_compute