/cmsis-nn-latest/Source/ConvolutionFunctions/ |
D | arm_nn_mat_mult_kernel_s4_s16.c | 65 const int16_t *ip_b1 = ip_b0 + num_col_a; in arm_nn_mat_mult_kernel_s4_s16() local 95 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s4_s16() 108 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s4_s16() 129 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s4_s16() 140 b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s4_s16() 158 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s4_s16() 201 ip_b1 = ip_b0 + num_col_a; in arm_nn_mat_mult_kernel_s4_s16() 226 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s4_s16() 241 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s4_s16() 254 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s4_s16() [all …]
|
D | arm_nn_mat_mult_kernel_row_offset_s8_s16.c | 68 const int16_t *ip_b1 = ip_b0 + aligned_num_col_a; in arm_nn_mat_mult_kernel_row_offset_s8_s16() local 93 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_row_offset_s8_s16() 104 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_row_offset_s8_s16() 124 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_row_offset_s8_s16() 171 const int16_t *ip_b1 = ip_b0 + aligned_num_col_a; in arm_nn_mat_mult_kernel_row_offset_s8_s16() local 189 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_row_offset_s8_s16() 197 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_row_offset_s8_s16() 212 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_row_offset_s8_s16()
|
D | arm_nn_mat_mult_kernel_s8_s16.c | 65 const int16_t *ip_b1 = ip_b0 + aligned_num_col_a; in arm_nn_mat_mult_kernel_s8_s16() local 90 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s8_s16() 101 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s8_s16() 119 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s8_s16() 166 const int16_t *ip_b1 = ip_b0 + aligned_num_col_a; in arm_nn_mat_mult_kernel_s8_s16() local 184 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s8_s16() 192 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s8_s16() 206 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s8_s16()
|
D | arm_nn_mat_mult_kernel_s16.c | 77 const int16_t *ip_b1 = ip_b0 + num_col_a; in arm_nn_mat_mult_kernel_s16() local 96 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s16() 107 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s16() 126 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s16() 186 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s16() 244 const int16_t *ip_b1 = ip_b0 + num_col_a; in arm_nn_mat_mult_kernel_s16() local 255 int32_t b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s16() 263 b1 = arm_nn_read_q15x2_ia(&ip_b1); in arm_nn_mat_mult_kernel_s16() 277 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s16() 317 int16_t b1 = *ip_b1++; in arm_nn_mat_mult_kernel_s16()
|
D | arm_convolve_s16.c | 224 int32_t ip_b1, ip_b2; in arm_convolve_s16() 228 ip_b1 = arm_nn_read_q15x2_ia(&ip_as_col); in arm_convolve_s16() 229 sum = SMLAD(ker_a1, ip_b1, sum); in arm_convolve_s16() 245 int16_t ip_b1 = *ip_as_col++; in arm_convolve_s16() 246 sum += ker_a1 * ip_b1; in arm_convolve_s16()
|
D | arm_convolve_s8.c | 292 int32_t ip_b1, ip_b2; in arm_convolve_s8() 296 ip_b1 = arm_nn_read_q15x2_ia(&ip_as_col); in arm_convolve_s8() 297 sum = SMLAD(ker_a1, ip_b1, sum); in arm_convolve_s8() 312 int16_t ip_b1 = *ip_as_col++; in arm_convolve_s8() 314 sum += ker_a1 * ip_b1; in arm_convolve_s8()
|
D | arm_depthwise_conv_s8_opt.c | 298 int32_t ip_a1, ip_a2, ip_b1, ip_b2, op_a, op_b, op_c; in arm_depthwise_conv_s8_opt() local 300 ip_b1 = arm_nn_read_s8x4(row_pos); in arm_depthwise_conv_s8_opt() 305 ip_a2 = SXTB16(ip_b1); in arm_depthwise_conv_s8_opt() 306 ip_b1 = SXTB16(ROR(ip_b1, 8)); in arm_depthwise_conv_s8_opt() 316 op_b = PKHBT(ip_b1, ip_a1, 16); in arm_depthwise_conv_s8_opt() 327 op_b = PKHTB(ip_a1, ip_b1, 16); in arm_depthwise_conv_s8_opt()
|
D | arm_depthwise_conv_s4_opt.c | 348 int32_t ip_a1, ip_a2, ip_b1, ip_b2, op_a, op_b, op_c; in arm_depthwise_conv_s4_opt() local 351 read_and_pad_s4(row_pos, &ip_a2, &ip_b1); in arm_depthwise_conv_s4_opt() 362 op_b = PKHBT(ip_b1, ip_a1, 16); in arm_depthwise_conv_s4_opt() 374 op_b = PKHTB(ip_a1, ip_b1, 16); in arm_depthwise_conv_s4_opt() 548 int32_t ip_a1, ip_a2, ip_b1, ip_b2, op_a, op_b, op_c; in arm_depthwise_conv_s4_opt() local 551 read_and_pad_s4(row_pos, &ip_a2, &ip_b1); in arm_depthwise_conv_s4_opt() 562 op_b = PKHBT(ip_b1, ip_a1, 16); in arm_depthwise_conv_s4_opt() 574 op_b = PKHTB(ip_a1, ip_b1, 16); in arm_depthwise_conv_s4_opt()
|
D | arm_convolve_s4.c | 275 int32_t ip_b1, ip_b2; in arm_convolve_s4() 279 ip_b1 = arm_nn_read_q15x2_ia(&ip_as_col); in arm_convolve_s4() 280 sum = SMLAD(ker_a1, ip_b1, sum); in arm_convolve_s4()
|