Searched refs:col_pos (Results 1 – 3 of 3) sorted by relevance
336 int16_t *col_pos = col_buffer_start + col_shift; in arm_depthwise_conv_s4_opt() local354 op_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_s4_opt()355 op_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_s4_opt()366 op_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_s4_opt()367 op_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_s4_opt()387 sum += ker0 * col_pos[0]; in arm_depthwise_conv_s4_opt()388 sum_2 += ker1 * col_pos[1]; in arm_depthwise_conv_s4_opt()389 sum_3 += ker2 * col_pos[2]; in arm_depthwise_conv_s4_opt()390 sum_4 += ker3 * col_pos[3]; in arm_depthwise_conv_s4_opt()398 sum += ker0 * col_pos[0 + input_ch]; in arm_depthwise_conv_s4_opt()[all …]
289 int16_t *col_pos = col_buffer_start + row_shift; in arm_depthwise_conv_s8_opt() local302 op_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_s8_opt()303 op_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_s8_opt()319 op_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_s8_opt()320 op_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_s8_opt()331 col_pos += input_ch << 1; in arm_depthwise_conv_s8_opt()338 sum += row_pos[0] * col_pos[0]; in arm_depthwise_conv_s8_opt()339 sum_2 += row_pos[1] * col_pos[1]; in arm_depthwise_conv_s8_opt()340 sum_3 += row_pos[2] * col_pos[2]; in arm_depthwise_conv_s8_opt()341 sum_4 += row_pos[3] * col_pos[3]; in arm_depthwise_conv_s8_opt()[all …]
299 int16_t *col_pos = col_buffer_start + row_shift; in arm_depthwise_conv_fast_s16() local312 col_a = arm_nn_read_s16x2(col_pos); in arm_depthwise_conv_fast_s16()313 col_b = arm_nn_read_s16x2(col_pos + input_ch); in arm_depthwise_conv_fast_s16()329 col_a = arm_nn_read_s16x2(col_pos + 2); in arm_depthwise_conv_fast_s16()330 col_b = arm_nn_read_s16x2(col_pos + input_ch + 2); in arm_depthwise_conv_fast_s16()341 col_pos += input_ch << 1; in arm_depthwise_conv_fast_s16()348 sum_1 += row_pos[0] * col_pos[0]; in arm_depthwise_conv_fast_s16()349 sum_2 += row_pos[1] * col_pos[1]; in arm_depthwise_conv_fast_s16()350 sum_3 += row_pos[2] * col_pos[2]; in arm_depthwise_conv_fast_s16()351 sum_4 += row_pos[3] * col_pos[3]; in arm_depthwise_conv_fast_s16()[all …]