/cmsis-nn-3.6.0-3.5.0/Source/NNSupportFunctions/ |
D | arm_q7_to_q15_with_offset.c | 42 void arm_q7_to_q15_with_offset(const int8_t *src, int16_t *dst, int32_t block_size, int16_t offset) in arm_q7_to_q15_with_offset() argument 56 vstrhq_s16(dst, source); in arm_q7_to_q15_with_offset() 57 dst += 8; in arm_q7_to_q15_with_offset() 89 arm_nn_write_q15x2_ia(&dst, out_q15x2_1); in arm_q7_to_q15_with_offset() 90 arm_nn_write_q15x2_ia(&dst, out_q15x2_2); in arm_q7_to_q15_with_offset() 105 *dst++ = (int16_t)*src++ + offset; in arm_q7_to_q15_with_offset()
|
D | arm_s8_to_s16_unordered_with_offset.c | 42 void arm_s8_to_s16_unordered_with_offset(const int8_t *src, int16_t *dst, int32_t block_size, int16… in arm_s8_to_s16_unordered_with_offset() argument 58 arm_nn_write_q15x2_ia(&dst, in_s16x2_1); in arm_s8_to_s16_unordered_with_offset() 59 arm_nn_write_q15x2_ia(&dst, in_s16x2_2); in arm_s8_to_s16_unordered_with_offset() 68 *dst++ = (int16_t)*src++ + offset; in arm_s8_to_s16_unordered_with_offset()
|
D | arm_nn_vec_mat_mul_result_acc_s8.c | 48 int16_t *dst, in arm_nn_vec_mat_mul_result_acc_s8() argument 114 acc = vaddq_s32(acc, vldrhq_s32(dst)); in arm_nn_vec_mat_mul_result_acc_s8() 119 vstrhq_s32(dst, acc); in arm_nn_vec_mat_mul_result_acc_s8() 120 dst += 4; in arm_nn_vec_mat_mul_result_acc_s8() 149 acc_0 += dst_offset + *dst; in arm_nn_vec_mat_mul_result_acc_s8() 153 *dst++ = (int16_t)acc_0; in arm_nn_vec_mat_mul_result_acc_s8() 207 acc_0 += dst_offset + *dst; in arm_nn_vec_mat_mul_result_acc_s8() 208 acc_1 += dst_offset + dst[1]; in arm_nn_vec_mat_mul_result_acc_s8() 213 *dst++ = (int16_t)acc_0; in arm_nn_vec_mat_mul_result_acc_s8() 214 *dst++ = (int16_t)acc_1; in arm_nn_vec_mat_mul_result_acc_s8() [all …]
|
D | arm_nn_vec_mat_mult_t_s8.c | 61 int8_t *dst, in arm_nn_vec_mat_mult_t_s8() argument 139 vstrbq_scatter_offset_p_s32(dst, address_offset_array, acc, p); in arm_nn_vec_mat_mult_t_s8() 143 vstrbq_p_s32(dst, acc, p); in arm_nn_vec_mat_mult_t_s8() 145 dst += 3 * address_offset; in arm_nn_vec_mat_mult_t_s8() 185 *dst = MIN(acc_0, activation_max); in arm_nn_vec_mat_mult_t_s8() 186 dst += address_offset; in arm_nn_vec_mat_mult_t_s8() 254 *dst = (int8_t)acc_0; in arm_nn_vec_mat_mult_t_s8() 255 *(dst + address_offset) = (int8_t)acc_1; in arm_nn_vec_mat_mult_t_s8() 256 dst += 2 * address_offset; in arm_nn_vec_mat_mult_t_s8() 300 *dst = (int8_t)acc_0; in arm_nn_vec_mat_mult_t_s8() [all …]
|
D | arm_nn_vec_mat_mult_t_svdf_s8.c | 51 int16_t *dst, in arm_nn_vec_mat_mult_t_svdf_s8() argument 121 *(dst) = (int16_t)acc[0]; in arm_nn_vec_mat_mult_t_svdf_s8() 122 *(dst + dst_offset) = (int16_t)acc[1]; in arm_nn_vec_mat_mult_t_svdf_s8() 123 *(dst + 2 * dst_offset) = (int16_t)acc[2]; in arm_nn_vec_mat_mult_t_svdf_s8() 124 dst += 3 * dst_offset; in arm_nn_vec_mat_mult_t_svdf_s8() 158 *dst = (int16_t)MIN(acc_0, activation_max); in arm_nn_vec_mat_mult_t_svdf_s8() 159 dst += dst_offset; in arm_nn_vec_mat_mult_t_svdf_s8() 294 *dst = (int16_t)acc_0; in arm_nn_vec_mat_mult_t_svdf_s8() 295 *(dst + dst_offset) = (int16_t)acc_1; in arm_nn_vec_mat_mult_t_svdf_s8() 296 dst += 2 * dst_offset; in arm_nn_vec_mat_mult_t_svdf_s8() [all …]
|
D | arm_nn_vec_mat_mult_t_s16.c | 53 int16_t *dst, in arm_nn_vec_mat_mult_t_s16() argument 144 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 150 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 156 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 162 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 213 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 278 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 283 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 325 *dst++ = (int16_t)tmp; in arm_nn_vec_mat_mult_t_s16() 359 *dst++ = (int16_t)result; in arm_nn_vec_mat_mult_t_s16()
|
D | arm_nn_mat_mult_nt_t_s8.c | 51 int8_t *dst, in arm_nn_mat_mult_nt_t_s8() argument 144 vstrbq_scatter_offset_s32(dst, scatter_offset, res); in arm_nn_mat_mult_nt_t_s8() 145 dst++; in arm_nn_mat_mult_nt_t_s8() 148 dst += (3 * rhs_rows); in arm_nn_mat_mult_nt_t_s8() 205 vstrbq_s32(dst, res); in arm_nn_mat_mult_nt_t_s8() 206 dst += 4; in arm_nn_mat_mult_nt_t_s8() 218 *dst++ = (int8_t)acc_n0; in arm_nn_mat_mult_nt_t_s8() 229 int8_t *dst_ptr = &dst[0]; in arm_nn_mat_mult_nt_t_s8() 576 dst += 2; in arm_nn_mat_mult_nt_t_s8() 582 int8_t *dst_ptr = &dst[0]; in arm_nn_mat_mult_nt_t_s8() [all …]
|
/cmsis-nn-3.6.0-3.5.0/Source/PoolingFunctions/ |
D | arm_max_pool_s8.c | 50 int8_t *dst = base; in compare_and_replace_if_larger_q7() 58 ref_max.word = arm_nn_read_s8x4(dst); in compare_and_replace_if_larger_q7() 78 arm_nn_write_s8x4_ia(&dst, ref_max.word); in compare_and_replace_if_larger_q7() 86 if (*src > *dst) in compare_and_replace_if_larger_q7() 88 *dst = *src; in compare_and_replace_if_larger_q7() 90 dst++; in compare_and_replace_if_larger_q7() 169 int8_t *dst) in arm_max_pool_s8() argument 185 int8_t *dst_base = dst; in arm_max_pool_s8() 209 arm_memcpy_s8(dst, start, channel_in); in arm_max_pool_s8() 214 compare_and_replace_if_larger_q7(dst, start, channel_in); in arm_max_pool_s8() [all …]
|
D | arm_max_pool_s16.c | 50 int16_t *dst = base; in compare_and_replace_if_larger() 58 ref_max.word = arm_nn_read_s16x2(dst); in compare_and_replace_if_larger() 70 arm_nn_write_q15x2_ia(&dst, ref_max.word); in compare_and_replace_if_larger() 77 if (*src > *dst) in compare_and_replace_if_larger() 79 *dst = *src; in compare_and_replace_if_larger() 151 int16_t *dst) in arm_max_pool_s16() argument 167 int16_t *dst_base = dst; in arm_max_pool_s16() 191 memcpy(dst, start, channel_in * sizeof(int16_t)); in arm_max_pool_s16() 196 compare_and_replace_if_larger(dst, start, channel_in); in arm_max_pool_s16() 201 dst += channel_in; in arm_max_pool_s16()
|
D | arm_avgpool_s16.c | 79 int16_t *dst) in arm_avgpool_s16() argument 107 int16_t *out = &dst[ch_src * (i_x + i_y * output_x)]; in arm_avgpool_s16() 238 scale_q31_to_q15_and_clamp(buffer, dst, ch_src, count, act_min, act_max); in arm_avgpool_s16() 239 dst += ch_src; in arm_avgpool_s16() 285 dst[i_ch_in + ch_src * (i_x + i_y * output_x)] = sum; in arm_avgpool_s16()
|
D | arm_avgpool_s8.c | 80 int8_t *dst) in arm_avgpool_s8() argument 108 int8_t *out = &dst[ch_src * (i_x + i_y * output_x)]; in arm_avgpool_s8() 226 int8_t *dst) in arm_avgpool_s8() argument 298 scale_q31_to_q7_and_clamp(buffer, dst, ch_src, count, act_min, act_max); in arm_avgpool_s8() 299 dst += ch_src; in arm_avgpool_s8() 338 dst[i_ch_in + ch_src * (i_x + i_y * output_x)] = sum; in arm_avgpool_s8()
|
/cmsis-nn-3.6.0-3.5.0/Include/ |
D | arm_nnsupportfunctions.h | 137 void arm_q7_to_q15_with_offset(const int8_t *src, int16_t *dst, int32_t block_size, int16_t offset); 162 void arm_s8_to_s16_unordered_with_offset(const int8_t *src, int16_t *dst, int32_t block_size, int16… 361 int8_t *dst, 398 int8_t *dst, 429 int16_t *dst, 459 int16_t *dst, 665 __STATIC_FORCEINLINE void arm_memset_s8(int8_t *dst, const int8_t val, uint32_t block_size) in arm_memset_s8() argument 674 : [in] "+r"(dst) in arm_memset_s8() 678 memset(dst, val, block_size); in arm_memset_s8() 951 __STATIC_FORCEINLINE void arm_memcpy_s8(int8_t *__RESTRICT dst, const int8_t *__RESTRICT src, uint3… in arm_memcpy_s8() argument [all …]
|
D | arm_nnfunctions.h | 1539 int16_t *dst);
|