Searched refs:out_buff (Results 1 – 3 of 3) sorted by relevance
/cmsis-nn-latest/Source/ConvolutionFunctions/ |
D | arm_depthwise_conv_s8.c | 88 int32_t out_buff[4] = {0, 0, 0, 0}; in depthwise_conv_s8_mult_4() local 91 out_buff[0] = *bias++; in depthwise_conv_s8_mult_4() 92 out_buff[1] = *bias++; in depthwise_conv_s8_mult_4() 93 out_buff[2] = *bias++; in depthwise_conv_s8_mult_4() 94 out_buff[3] = *bias++; in depthwise_conv_s8_mult_4() 109 out_buff[0] += in_val * kernel[0]; in depthwise_conv_s8_mult_4() 110 out_buff[1] += in_val * kernel[1]; in depthwise_conv_s8_mult_4() 111 out_buff[2] += in_val * kernel[2]; in depthwise_conv_s8_mult_4() 112 out_buff[3] += in_val * kernel[3]; in depthwise_conv_s8_mult_4() 116 int32x4_t res = vldrwq_s32(out_buff); in depthwise_conv_s8_mult_4() [all …]
|
D | arm_depthwise_conv_s16.c | 79 int64_t out_buff[4] = {0, 0, 0, 0}; in depthwise_conv_s16_mult_4_s16() local 83 out_buff[0] = bias[out_ch + 0 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 84 out_buff[1] = bias[out_ch + 1 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 85 out_buff[2] = bias[out_ch + 2 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 86 out_buff[3] = bias[out_ch + 3 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 102 out_buff[0] += in_val * kernel[ker_idx + 0 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 103 out_buff[1] += in_val * kernel[ker_idx + 1 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 104 out_buff[2] += in_val * kernel[ker_idx + 2 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 105 out_buff[3] += in_val * kernel[ker_idx + 3 + mult_tile]; in depthwise_conv_s16_mult_4_s16() 110 … arm_nn_requantize_s64(out_buff[0], out_buff32[0], output_shift[out_ch + 0 + mult_tile]); in depthwise_conv_s16_mult_4_s16() [all …]
|
D | arm_depthwise_conv_3x3_s8.c | 241 int32_t out_buff = 0; in arm_depthwise_conv_3x3_s8() local 244 out_buff = *bias++; in arm_depthwise_conv_3x3_s8() 254 out_buff += (*(input_ptr) + input_offset) * *(kernel_ptr); in arm_depthwise_conv_3x3_s8() 257 out_buff += (*(input_ptr + input_ch) + input_offset) * *(kernel_ptr + input_ch); in arm_depthwise_conv_3x3_s8() 261 … out_buff += (*(input_ptr + (input_ch << 1)) + input_offset) * *(kernel_ptr + (input_ch << 1)); in arm_depthwise_conv_3x3_s8() 268 out_buff = arm_nn_requantize(out_buff, output_mult[in_ch], output_shift[in_ch]); in arm_depthwise_conv_3x3_s8() 269 out_buff += output_offset; in arm_depthwise_conv_3x3_s8() 270 out_buff = MIN(MAX(out_buff, output_activation_min), output_activation_max); in arm_depthwise_conv_3x3_s8() 271 output[out_idx++] = (int8_t)out_buff; in arm_depthwise_conv_3x3_s8()
|