/cmsis-nn-latest/Source/PoolingFunctions/ |
D | arm_avgpool_get_buffer_sizes_s16.c | 42 int32_t arm_avgpool_s16_get_buffer_size(const int output_x, const int ch_src) in arm_avgpool_s16_get_buffer_size() argument 45 return arm_avgpool_s16_get_buffer_size_mve(output_x, ch_src); in arm_avgpool_s16_get_buffer_size() 47 return arm_avgpool_s16_get_buffer_size_dsp(output_x, ch_src); in arm_avgpool_s16_get_buffer_size() 49 (void)output_x; in arm_avgpool_s16_get_buffer_size() 55 int32_t arm_avgpool_s16_get_buffer_size_dsp(const int output_x, const int ch_src) in arm_avgpool_s16_get_buffer_size_dsp() argument 57 (void)output_x; in arm_avgpool_s16_get_buffer_size_dsp() 61 int32_t arm_avgpool_s16_get_buffer_size_mve(const int output_x, const int ch_src) in arm_avgpool_s16_get_buffer_size_mve() argument 63 (void)output_x; in arm_avgpool_s16_get_buffer_size_mve()
|
D | arm_avgpool_get_buffer_sizes_s8.c | 42 int32_t arm_avgpool_s8_get_buffer_size(const int output_x, const int ch_src) in arm_avgpool_s8_get_buffer_size() argument 45 return arm_avgpool_s8_get_buffer_size_mve(output_x, ch_src); in arm_avgpool_s8_get_buffer_size() 47 return arm_avgpool_s8_get_buffer_size_dsp(output_x, ch_src); in arm_avgpool_s8_get_buffer_size() 49 (void)output_x; in arm_avgpool_s8_get_buffer_size() 55 int32_t arm_avgpool_s8_get_buffer_size_dsp(const int output_x, const int ch_src) in arm_avgpool_s8_get_buffer_size_dsp() argument 57 (void)output_x; in arm_avgpool_s8_get_buffer_size_dsp() 61 int32_t arm_avgpool_s8_get_buffer_size_mve(const int output_x, const int ch_src) in arm_avgpool_s8_get_buffer_size_mve() argument 63 (void)output_x; in arm_avgpool_s8_get_buffer_size_mve()
|
D | arm_avgpool_s16.c | 84 const int32_t output_x = output_dims->w; in arm_avgpool_s16() local 105 const int32_t batch_output = output_x * output_y * ch_src; in arm_avgpool_s16() 111 for (int i_x = 0; i_x < output_x; i_x++) in arm_avgpool_s16() 120 int16_t *out = &dst[ch_src * (i_x + i_y * output_x)]; in arm_avgpool_s16() 215 for (int i_x = 0, idx_x = -pad_x; i_x < output_x; idx_x += stride_x, i_x++) in arm_avgpool_s16() 271 const int32_t batch_output = output_x * output_y * ch_src; in arm_avgpool_s16() 278 for (int i_x = 0, base_idx_x = -pad_x; i_x < output_x; base_idx_x += stride_x, i_x++) in arm_avgpool_s16() 312 dst[i_ch_in + ch_src * (i_x + i_y * output_x)] = sum; in arm_avgpool_s16()
|
D | arm_avgpool_s8.c | 86 const int32_t output_x = output_dims->w; in arm_avgpool_s8() local 97 const int32_t batch_output = output_x * output_y * ch_src; in arm_avgpool_s8() 109 for (int i_x = 0; i_x < output_x; i_x++) in arm_avgpool_s8() 118 int8_t *out = &dst[ch_src * (i_x + i_y * output_x)]; in arm_avgpool_s8() 247 const int32_t output_x = output_dims->w; in arm_avgpool_s8() local 279 for (int i_x = 0, idx_x = -pad_x; i_x < output_x; idx_x += stride_x, i_x++) in arm_avgpool_s8() 337 const int32_t batch_output = output_x * output_y * ch_src; in arm_avgpool_s8() 343 for (int i_x = 0; i_x < output_x; i_x++) in arm_avgpool_s8() 371 dst[i_ch_in + ch_src * (i_x + i_y * output_x)] = sum; in arm_avgpool_s8()
|
D | arm_max_pool_s16.c | 157 const int32_t output_x = output_dims->w; in arm_max_pool_s16() local 182 for (int i_x = 0, base_idx_x = -pad_x; i_x < output_x; base_idx_x += stride_x, i_x++) in arm_max_pool_s16() 216 clamp_output(dst_base, output_x * output_y * channel_in, act_min, act_max); in arm_max_pool_s16()
|
D | arm_max_pool_s8.c | 174 const int32_t output_x = output_dims->w; in arm_max_pool_s8() local 198 for (int i_x = 0, base_idx_x = -pad_x; i_x < output_x; base_idx_x += stride_x, i_x++) in arm_max_pool_s8() 232 clamp_output(dst_base, output_x * output_y * channel_in, act_min, act_max); in arm_max_pool_s8()
|
/cmsis-nn-latest/Source/ConcatenationFunctions/ |
D | arm_concatenation_s8_x.c | 55 const uint16_t output_x, in arm_concatenation_s8_x() argument 69 output += output_x; in arm_concatenation_s8_x()
|
/cmsis-nn-latest/Source/ConvolutionFunctions/ |
D | arm_transpose_conv_s8.c | 78 const int32_t output_x = output_dims->w; in arm_transpose_conv_s8() local 112 … arm_memset_s8((int8_t *)img_buf_ptr, 0, output_x * output_y * output_ch * sizeof(int32_t)); in arm_transpose_conv_s8() 118 for (int i = 0; i < output_x * output_y; i++) in arm_transpose_conv_s8() 148 const int32_t col_x = (output_x + pad_x_offset + pad_x - kernel_x) / stride_x + 1; in arm_transpose_conv_s8() 155 int32_t *dst_data = img_data + (i_pad_y * output_x + i_pad_x) * output_ch; in arm_transpose_conv_s8() 161 … if (i_ker_y >= 0 && i_ker_y < output_y && i_ker_x >= 0 && i_ker_x < output_x) in arm_transpose_conv_s8() 171 dst_data += (output_x - kernel_x) * output_ch; in arm_transpose_conv_s8() 176 for (int i = 0; i < output_x * output_y; i++) in arm_transpose_conv_s8()
|
D | arm_convolve_1_x_n_s4.c | 75 const uint16_t output_x = output_dims->w; in arm_convolve_1_x_n_s4() local 82 const int32_t total_pad = ((output_x - 1) * stride_x + kernel_x - input_x); in arm_convolve_1_x_n_s4() 92 const int32_t no_pad_num = MAX(output_x - (right_pad_num + left_pad_num), 0); in arm_convolve_1_x_n_s4() 94 if (right_pad_num + no_pad_num + left_pad_num != output_x) in arm_convolve_1_x_n_s4() 154 lhs_rows = output_x - out_idx; in arm_convolve_1_x_n_s4() 161 for (int i = out_idx; i < output_x; i++) in arm_convolve_1_x_n_s4()
|
D | arm_convolve_1_x_n_s8.c | 74 const int32_t output_x = output_dims->w; in arm_convolve_1_x_n_s8() local 80 const int32_t total_pad = ((output_x - 1) * stride_x + kernel_x - input_x); in arm_convolve_1_x_n_s8() 90 const int32_t no_pad_num = MAX(output_x - (right_pad_num + left_pad_num), 0); in arm_convolve_1_x_n_s8() 99 if (right_pad_num + no_pad_num + left_pad_num != output_x) in arm_convolve_1_x_n_s8() 177 lhs_rows = output_x - out_idx; in arm_convolve_1_x_n_s8()
|
D | arm_convolve_get_buffer_sizes_s4.c | 63 const int32_t output_x = output_dims->w; in arm_convolve_1_x_n_s4_get_buffer_size_mve() local 65 const int32_t total_pad = ((output_x - 1) * stride_x + kernel_x - input_x); in arm_convolve_1_x_n_s4_get_buffer_size_mve() 70 const int32_t no_pad_num = MAX(output_x - (right_pad_num + left_pad_num), 0); in arm_convolve_1_x_n_s4_get_buffer_size_mve() 72 if (right_pad_num + no_pad_num + left_pad_num != output_x) in arm_convolve_1_x_n_s4_get_buffer_size_mve()
|
D | arm_convolve_get_buffer_sizes_s8.c | 63 const int32_t output_x = output_dims->w; in arm_convolve_1_x_n_s8_get_buffer_size_mve() local 65 const int32_t total_pad = ((output_x - 1) * stride_x + kernel_x - input_x); in arm_convolve_1_x_n_s8_get_buffer_size_mve() 70 const int32_t no_pad_num = MAX(output_x - (right_pad_num + left_pad_num), 0); in arm_convolve_1_x_n_s8_get_buffer_size_mve() 72 if (right_pad_num + no_pad_num + left_pad_num != output_x) in arm_convolve_1_x_n_s8_get_buffer_size_mve()
|
D | arm_convolve_s4.c | 76 const uint16_t output_x = output_dims->w; in arm_convolve_s4() local 108 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_convolve_s4() 192 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_convolve_s4() 326 output_data += (output_x * output_y * output_ch); in arm_convolve_s4()
|
D | arm_convolve_s16.c | 76 const int32_t output_x = output_dims->w; in arm_convolve_s16() local 107 for (int32_t i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_convolve_s16() 283 output_data += (output_x * output_y * output_ch); in arm_convolve_s16()
|
D | arm_depthwise_conv_s16.c | 60 const int32_t output_x, in depthwise_conv_s16_mult_4_s16() argument 67 …for (int32_t in_w = -pad_x, out_w = 0, ker_h_start = MAX(0, -in_h); out_w < output_x; in_w += stri… in depthwise_conv_s16_mult_4_s16() 150 const uint16_t output_x, in depthwise_conv_s16_generic_s16() argument 163 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in depthwise_conv_s16_generic_s16()
|
D | arm_depthwise_conv_s8.c | 64 const int32_t output_x, in depthwise_conv_s8_mult_4() argument 78 …for (int32_t in_w = -pad_x, out_w = 0, ker_h_start = MAX(0, -in_h); out_w < output_x; in_w += stri… in depthwise_conv_s8_mult_4() 172 const uint16_t output_x, in depthwise_conv_s8_generic() argument 191 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in depthwise_conv_s8_generic()
|
D | arm_convolve_s8.c | 76 const uint16_t output_x = output_dims->w; in arm_convolve_s8() local 132 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_convolve_s8() 337 output_data += (output_x * output_y * output_ch); in arm_convolve_s8()
|
D | arm_depthwise_conv_s8_opt.c | 88 const int32_t output_x = output_dims->w; in arm_depthwise_conv_s8_opt() local 115 … for (int i_out_x = 0, base_idx_x = -pad_x; i_out_x < output_x; base_idx_x += stride_x, i_out_x++) in arm_depthwise_conv_s8_opt() 223 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_depthwise_conv_s8_opt()
|
D | arm_depthwise_conv_fast_s16.c | 95 const int32_t output_x = output_dims->w; in arm_depthwise_conv_fast_s16() local 112 … for (int i_out_x = 0, base_idx_x = -pad_x; i_out_x < output_x; base_idx_x += stride_x, i_out_x++) in arm_depthwise_conv_fast_s16() 234 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_depthwise_conv_fast_s16()
|
D | arm_depthwise_conv_s4.c | 61 const int32_t output_x, in depthwise_conv_s4_generic() argument 83 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in depthwise_conv_s4_generic() 374 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in depthwise_conv_s4_generic()
|
D | arm_depthwise_conv_3x3_s8.c | 77 const int32_t output_x = output_dims->w; in arm_depthwise_conv_3x3_s8() local 97 …for (int32_t in_w = -pad_x, out_w = 0, ker_h_start = MAX(0, -in_h); out_w < output_x; in_w += stri… in arm_depthwise_conv_3x3_s8()
|
D | arm_depthwise_conv_s4_opt.c | 89 const int32_t output_x = output_dims->w; in arm_depthwise_conv_s4_opt() local 116 … for (int i_out_x = 0, base_idx_x = -pad_x; i_out_x < output_x; base_idx_x += stride_x, i_out_x++) in arm_depthwise_conv_s4_opt() 265 for (int i_out_x = 0; i_out_x < output_x; i_out_x++) in arm_depthwise_conv_s4_opt()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/Common/ |
D | conv2d_s4_weights_template.json | 71 output_x,
|
D | dw_s4_weights_template.json | 66 output_x,
|
/cmsis-nn-latest/Tests/UnitTest/ |
D | conv_settings.py | 264 output_x = math.ceil(float(self.x_input) / float(self.stride_x)) 270 …output_x = math.ceil(float(self.x_input - self.filter_x - dilation_filter_x + 1) / float(self.stri… 281 "output_x": output_x,
|