Home
last modified time | relevance | path

Searched refs:col_pos (Results 1 – 3 of 3) sorted by relevance

/cmsis-nn-latest/Source/ConvolutionFunctions/
Darm_depthwise_conv_s4_opt.c336 int16_t *col_pos = col_buffer_start + col_shift; in arm_depthwise_conv_s4_opt() local
354 op_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_s4_opt()
355 op_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_s4_opt()
366 op_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_s4_opt()
367 op_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_s4_opt()
387 sum += ker0 * col_pos[0]; in arm_depthwise_conv_s4_opt()
388 sum_2 += ker1 * col_pos[1]; in arm_depthwise_conv_s4_opt()
389 sum_3 += ker2 * col_pos[2]; in arm_depthwise_conv_s4_opt()
390 sum_4 += ker3 * col_pos[3]; in arm_depthwise_conv_s4_opt()
398 sum += ker0 * col_pos[0 + input_ch]; in arm_depthwise_conv_s4_opt()
[all …]
Darm_depthwise_conv_s8_opt.c289 int16_t *col_pos = col_buffer_start + row_shift; in arm_depthwise_conv_s8_opt() local
302 op_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_s8_opt()
303 op_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_s8_opt()
319 op_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_s8_opt()
320 op_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_s8_opt()
331 col_pos += input_ch << 1; in arm_depthwise_conv_s8_opt()
338 sum += row_pos[0] * col_pos[0]; in arm_depthwise_conv_s8_opt()
339 sum_2 += row_pos[1] * col_pos[1]; in arm_depthwise_conv_s8_opt()
340 sum_3 += row_pos[2] * col_pos[2]; in arm_depthwise_conv_s8_opt()
341 sum_4 += row_pos[3] * col_pos[3]; in arm_depthwise_conv_s8_opt()
[all …]
Darm_depthwise_conv_fast_s16.c299 int16_t *col_pos = col_buffer_start + row_shift; in arm_depthwise_conv_fast_s16() local
312 col_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_fast_s16()
313 col_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_fast_s16()
329 col_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_fast_s16()
330 col_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_fast_s16()
341 col_pos += input_ch << 1; in arm_depthwise_conv_fast_s16()
348 sum_1 += row_pos[0] * col_pos[0]; in arm_depthwise_conv_fast_s16()
349 sum_2 += row_pos[1] * col_pos[1]; in arm_depthwise_conv_fast_s16()
350 sum_3 += row_pos[2] * col_pos[2]; in arm_depthwise_conv_fast_s16()
351 sum_4 += row_pos[3] * col_pos[3]; in arm_depthwise_conv_fast_s16()
[all …]