/cmsis-nn-latest/Source/ConvolutionFunctions/ |
D | arm_depthwise_conv_3x3_s8.c | 80 const int32_t input_offset = dw_conv_params->input_offset; in arm_depthwise_conv_3x3_s8() local 120 const uint32_t lhs_offset_s16x2 = PKHBT(input_offset, input_offset, 16); in arm_depthwise_conv_3x3_s8() 187 out_buff0 += ((int8_t)in_val + input_offset) * (int8_t)ker_val; in arm_depthwise_conv_3x3_s8() 188 … out_buff1 += ((int8_t)(in_val >> 8) + input_offset) * (int8_t)(ker_val >> 8); in arm_depthwise_conv_3x3_s8() 189 … out_buff2 += ((int8_t)(in_val >> 16) + input_offset) * (int8_t)(ker_val >> 16); in arm_depthwise_conv_3x3_s8() 190 … out_buff3 += ((int8_t)(in_val >> 24) + input_offset) * (int8_t)(ker_val >> 24); in arm_depthwise_conv_3x3_s8() 196 out_buff0 += ((int8_t)in_val + input_offset) * (int8_t)ker_val; in arm_depthwise_conv_3x3_s8() 197 out_buff1 += ((int8_t)(in_val >> 8) + input_offset) * (int8_t)(ker_val >> 8); in arm_depthwise_conv_3x3_s8() 198 out_buff2 += ((int8_t)(in_val >> 16) + input_offset) * (int8_t)(ker_val >> 16); in arm_depthwise_conv_3x3_s8() 199 out_buff3 += ((int8_t)(in_val >> 24) + input_offset) * (int8_t)(ker_val >> 24); in arm_depthwise_conv_3x3_s8() [all …]
|
D | arm_convolve_even_s4.c | 92 const int32_t input_offset = conv_params->input_offset; in arm_convolve_even_s4() local 131 … arm_memset_s8(im2col_buf, (int8_t)-input_offset, sizeof(int8_t) * input_ch); in arm_convolve_even_s4() 168 input_offset, in arm_convolve_even_s4() 194 input_offset, in arm_convolve_even_s4()
|
D | arm_convolve_1_x_n_s8.c | 124 …arm_memset_s8(im2col, (int8_t)-conv_params->input_offset, sizeof(int8_t) * (uint32_t)pad_size_left… in arm_convolve_1_x_n_s8() 137 conv_params->input_offset, in arm_convolve_1_x_n_s8() 167 conv_params->input_offset, in arm_convolve_1_x_n_s8() 190 …arm_memset_s8(im2col, (int8_t)-conv_params->input_offset, sizeof(int8_t) * (uint32_t)pad_size_righ… in arm_convolve_1_x_n_s8() 201 conv_params->input_offset, in arm_convolve_1_x_n_s8()
|
D | arm_convolve_s8.c | 90 const int32_t input_offset = conv_params->input_offset; in arm_convolve_s8() local 156 … im2col_buf, (int8_t)-input_offset, sizeof(int8_t) * kernel_ch * kernel_x * kernel_y); in arm_convolve_s8() 198 … arm_memset_s8(im2col_buf, (int8_t)-input_offset, sizeof(int8_t) * kernel_ch); in arm_convolve_s8() 227 input_offset, in arm_convolve_s8() 243 … im2col_buf - rhs_cols, im2col_buf_start_s16, rhs_cols, (int16_t)input_offset); in arm_convolve_s8() 247 … im2col_buf - rhs_cols, im2col_buf_start_s16, rhs_cols, (int16_t)input_offset); in arm_convolve_s8() 313 input_offset, in arm_convolve_s8()
|
D | arm_convolve_s4.c | 90 const int32_t input_offset = conv_params->input_offset; in arm_convolve_s4() local 122 … arm_memset_s8(im2col_buf, (int8_t)-input_offset, sizeof(int8_t) * input_ch); in arm_convolve_s4() 145 input_offset, in arm_convolve_s4() 170 input_offset, in arm_convolve_s4() 208 … input_data + (k_y * input_x + k_x) * input_ch, two_column_buf, input_ch, input_offset); in arm_convolve_s4()
|
D | arm_depthwise_conv_s8.c | 67 const int32_t input_offset, in depthwise_conv_s8_mult_4() argument 108 int32_t in_val = input[in_idx + ker_w * input_ch] + input_offset; in depthwise_conv_s8_mult_4() 175 const int32_t input_offset, in depthwise_conv_s8_generic() argument 246 acc_0 += (input[idx_0] + input_offset) * kernel[ker_idx_0]; in depthwise_conv_s8_generic() 314 dw_conv_params->input_offset, in arm_depthwise_conv_s8() 341 dw_conv_params->input_offset, in arm_depthwise_conv_s8()
|
D | arm_convolve_1x1_s4_fast.c | 85 conv_params->input_offset, in arm_convolve_1x1_s4_fast()
|
D | arm_depthwise_conv_s4.c | 64 const int32_t input_offset, in depthwise_conv_s4_generic() argument 150 acc_0 += (input[idx_0] + input_offset) * ker_val0; in depthwise_conv_s4_generic() 151 acc_1 += (input[idx_0 + 1] + input_offset) * ker_val1; in depthwise_conv_s4_generic() 248 acc_0 += (input[idx_0] + input_offset) * ker_val0; in depthwise_conv_s4_generic() 335 acc_0 += (input[idx_0] + input_offset) * ker_val0; in depthwise_conv_s4_generic() 336 acc_1 += (input[idx_0] + input_offset) * ker_val1; in depthwise_conv_s4_generic() 454 acc_0 += (input[idx_0] + input_offset) * ker_val; in depthwise_conv_s4_generic() 530 dw_conv_params->input_offset, in arm_depthwise_conv_s4()
|
D | arm_transpose_conv_wrapper_s8.c | 96 conv_params.input_offset = transpose_conv_params->input_offset; in arm_transpose_conv_wrapper_s8()
|
D | arm_depthwise_conv_s8_opt.c | 91 const int32_t input_offset = dw_conv_params->input_offset; in arm_depthwise_conv_s8_opt() local 123 arm_memset_s8(lhs_buffer, (int8_t)-input_offset, (uint32_t)active_ch); in arm_depthwise_conv_s8_opt() 143 input_offset, in arm_depthwise_conv_s8_opt() 184 ip_0 = vaddq_n_s32(ip_0, input_offset); in arm_depthwise_conv_s8_opt() 256 (int16_t)input_offset); in arm_depthwise_conv_s8_opt()
|
/cmsis-nn-latest/Include/ |
D | arm_nn_types.h | 135 int32_t input_offset; /**< The negative of the zero value for the input tensor */ member 146 int32_t input_offset; /**< The negative of the zero value for the input tensor */ member 158 int32_t input_offset; /**< The negative of the zero value for the input tensor */ member 178 int32_t input_offset; /**< The negative of the zero value for the input tensor */ member 203 int32_t input_offset; /**< The negative of the zero value for the input tensor */ member 250 int32_t input_offset; member
|
/cmsis-nn-latest/Source/NNSupportFunctions/ |
D | arm_nn_depthwise_conv_nt_t_padded_s8.c | 58 const int32_t input_offset, in arm_nn_depthwise_conv_nt_t_padded_s8() argument 99 ip_0 = vaddq_n_s32(ip_0, input_offset); in arm_nn_depthwise_conv_nt_t_padded_s8() 103 ip_1 = vaddq_n_s32(ip_1, input_offset); in arm_nn_depthwise_conv_nt_t_padded_s8() 107 ip_2 = vaddq_n_s32(ip_2, input_offset); in arm_nn_depthwise_conv_nt_t_padded_s8() 111 ip_3 = vaddq_n_s32(ip_3, input_offset); in arm_nn_depthwise_conv_nt_t_padded_s8() 159 (void)input_offset; in arm_nn_depthwise_conv_nt_t_padded_s8()
|
D | arm_nn_depthwise_conv_nt_t_s8.c | 49 const int32_t input_offset, in arm_nn_depthwise_conv_nt_t_s8() argument 111 ker_sum = vmulq_n_s32(ker_sum, input_offset); in arm_nn_depthwise_conv_nt_t_s8() 152 (void)input_offset; in arm_nn_depthwise_conv_nt_t_s8()
|
D | arm_nn_depthwise_conv_nt_t_s4.c | 51 const int32_t input_offset, in arm_nn_depthwise_conv_nt_t_s4() argument 169 ker_sum = vmulq_n_s32(ker_sum, input_offset); in arm_nn_depthwise_conv_nt_t_s4() 210 (void)input_offset; in arm_nn_depthwise_conv_nt_t_s4()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_ds_cnn_s_s8/ |
D | test_arm_ds_cnn_s_s8.c | 80 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_2_INPUT_OFFSET; in ds_cnn_s_s8_get_buffer_size() 141 conv_params.input_offset = CONV_2D_1_INPUT_OFFSET; in ds_cnn_s_s8_inference() 192 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_2_INPUT_OFFSET; in ds_cnn_s_s8_inference() 236 conv_params.input_offset = CONV_2D_3_INPUT_OFFSET; in ds_cnn_s_s8_inference() 256 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_4_INPUT_OFFSET; in ds_cnn_s_s8_inference() 275 conv_params.input_offset = CONV_2D_5_INPUT_OFFSET; in ds_cnn_s_s8_inference() 295 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_6_INPUT_OFFSET; in ds_cnn_s_s8_inference() 314 conv_params.input_offset = CONV_2D_7_INPUT_OFFSET; in ds_cnn_s_s8_inference() 333 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_8_INPUT_OFFSET; in ds_cnn_s_s8_inference() 351 conv_params.input_offset = CONV_2D_9_INPUT_OFFSET; in ds_cnn_s_s8_inference() [all …]
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_ds_cnn_l_s8/ |
D | test_arm_ds_cnn_l_s8.c | 79 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_2_INPUT_OFFSET; in ds_cnn_l_s8_get_buffer_size() 158 conv_params.input_offset = CONV_2D_1_INPUT_OFFSET; in ds_cnn_l_s8_inference() 202 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_2_INPUT_OFFSET; in ds_cnn_l_s8_inference() 250 conv_params.input_offset = CONV_2D_3_INPUT_OFFSET; in ds_cnn_l_s8_inference() 276 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_4_INPUT_OFFSET; in ds_cnn_l_s8_inference() 295 conv_params.input_offset = CONV_2D_5_INPUT_OFFSET; in ds_cnn_l_s8_inference() 315 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_6_INPUT_OFFSET; in ds_cnn_l_s8_inference() 334 conv_params.input_offset = CONV_2D_7_INPUT_OFFSET; in ds_cnn_l_s8_inference() 353 dw_conv_params.input_offset = DEPTHWISE_CONV_2D_8_INPUT_OFFSET; in ds_cnn_l_s8_inference() 371 conv_params.input_offset = CONV_2D_9_INPUT_OFFSET; in ds_cnn_l_s8_inference() [all …]
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_fully_connected_s8/ |
D | test_arm_fully_connected_s8.c | 60 fc_params.input_offset = FULLY_CONNECTED_INPUT_OFFSET; in fully_connected_arm_fully_connected_s8() 80 fc_params.input_offset, in fully_connected_arm_fully_connected_s8() 135 fc_params.input_offset = FULLY_CONNECTED_W_ZP_INPUT_OFFSET; in fully_connected_w_zp_arm_fully_connected_s8() 155 fc_params.input_offset, in fully_connected_w_zp_arm_fully_connected_s8() 206 fc_params.input_offset = FULLY_CONNECTED_MVE_0_INPUT_OFFSET; in fully_connected_mve_0_arm_fully_connected_s8() 225 fc_params.input_offset, in fully_connected_mve_0_arm_fully_connected_s8() 275 fc_params.input_offset = FULLY_CONNECTED_MVE_1_INPUT_OFFSET; in fully_connected_mve_1_arm_fully_connected_s8() 294 fc_params.input_offset, in fully_connected_mve_1_arm_fully_connected_s8() 344 fc_params.input_offset = FULLY_CONNECTED_NULL_BIAS_0_INPUT_OFFSET; in fully_connected_null_bias_0_arm_fully_connected_s8() 374 fc_params.input_offset, in fully_connected_null_bias_0_arm_fully_connected_s8() [all …]
|
/cmsis-nn-latest/Source/FullyConnectedFunctions/ |
D | arm_batch_matmul_s8.c | 88 bmm_params->fc_params.input_offset, in arm_batch_matmul_s8() 103 bmm_params->fc_params.input_offset, in arm_batch_matmul_s8()
|
D | arm_fully_connected_s4.c | 75 fc_params->input_offset, in arm_fully_connected_s4()
|
D | arm_fully_connected_per_channel_s8.c | 82 fc_params->input_offset, in arm_fully_connected_per_channel_s8()
|
D | arm_fully_connected_s8.c | 83 fc_params->input_offset, in arm_fully_connected_s8()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_fully_connected_s4/ |
D | test_arm_fully_connected_s4.c | 60 fc_params.input_offset = FULLY_CONNECTED_INT4_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4() 123 fc_params.input_offset = FULLY_CONNECTED_INT4_2_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4_2() 186 fc_params.input_offset = FULLY_CONNECTED_INT4_3_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4_3() 249 fc_params.input_offset = FULLY_CONNECTED_INT4_4_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4_4() 312 fc_params.input_offset = FULLY_CONNECTED_INT4_5_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4_5() 375 fc_params.input_offset = FULLY_CONNECTED_INT4_6_INPUT_OFFSET; in fully_connected_int4_arm_fully_connected_s4_6()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_convolve_1x1_s4_fast/ |
D | test_arm_convolve_1x1_s4_fast.c | 73 conv_params.input_offset = KERNEL1X1_INT4_INPUT_OFFSET; in kernel1x1_arm_convolve_1x1_s4_fast() 147 conv_params.input_offset = KERNEL1X1_INT4_2_INPUT_OFFSET; in kernel1x1_2_arm_convolve_1x1_s4_fast() 220 conv_params.input_offset = KERNEL1X1_INT4_3_INPUT_OFFSET; in kernel1x1_3_arm_convolve_1x1_s4_fast() 296 conv_params.input_offset = KERNEL1X1_STRIDE_X_INT4_INPUT_OFFSET; in kernel1x1_stride_x_arm_convolve_1x1_s4() 386 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_INT4_INPUT_OFFSET; in kernel1x1_stride_x_y_arm_convolve_1x1_s4() 479 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_1_INT4_INPUT_OFFSET; in kernel1x1_stride_x_y_1_arm_convolve_1x1_s4() 548 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INT4_INPUT_OFFSET; in kernel1x1_stride_x_y_2_arm_convolve_1x1_s4() 598 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INT4_INPUT_OFFSET; in buffer_size_arm_convolve_1x1_s4_fast() 635 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INT4_INPUT_OFFSET; in buffer_size_mve_arm_convolve_1x1_s4_fast() 674 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INT4_INPUT_OFFSET; in buffer_size_dsp_arm_convolve_1x1_s4_fast()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_fully_connected_s16/ |
D | test_arm_fully_connected_s16.c | 58 fc_params.input_offset = 0; in fully_connected_int16_arm_fully_connected_s16() 123 fc_params.input_offset = 0; in fully_connected_int16_big_arm_fully_connected_s16() 187 fc_params.input_offset = 0; in fc_int16_slow_arm_fully_connected_s16()
|
/cmsis-nn-latest/Tests/UnitTest/TestCases/test_arm_convolve_1x1_s8_fast/ |
D | test_arm_convolve_1x1_s8_fast.c | 69 conv_params.input_offset = KERNEL1X1_INPUT_OFFSET; in kernel1x1_arm_convolve_1x1_s8_fast() 143 conv_params.input_offset = KERNEL1X1_STRIDE_X_INPUT_OFFSET; in kernel1x1_stride_x_arm_convolve_1x1_s8() 231 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_INPUT_OFFSET; in kernel1x1_stride_x_y_arm_convolve_1x1_s8() 322 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_1_INPUT_OFFSET; in kernel1x1_stride_x_y_1_arm_convolve_1x1_s8() 389 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INPUT_OFFSET; in kernel1x1_stride_x_y_2_arm_convolve_1x1_s8() 439 conv_params.input_offset = KERNEL1X1_INPUT_OFFSET; in buffer_size_arm_convolve_1x1_s8_fast() 479 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INPUT_OFFSET; in buffer_size_mve_arm_convolve_1x1_s8_fast() 518 conv_params.input_offset = KERNEL1X1_STRIDE_X_Y_2_INPUT_OFFSET; in buffer_size_dsp_arm_convolve_1x1_s8_fast()
|