/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Include/ |
D | arm_nnfunctions.h | 198 const q7_t *input_data, 200 const q7_t *filter_data, 204 q7_t *output_data); 256 const q7_t *input_data, 258 const q7_t *filter_data, 262 q7_t *output_data); 295 arm_status arm_convolve_HWC_q7_basic(const q7_t *Im_in, 298 const q7_t *wt, 303 const q7_t *bias, 306 q7_t *Im_out, [all …]
|
D | arm_nnsupportfunctions.h | 59 q7_t bytes[4]; 92 void arm_q7_to_q15_no_shift(const q7_t *pSrc, q15_t *pDst, uint32_t blockSize); 110 void arm_nn_add_q7(const q7_t *input, q31_t *output, uint32_t block_size); 120 void arm_q7_to_q15_reordered_no_shift(const q7_t *pSrc, q15_t *pDst, uint32_t blockSize); 138 void arm_q7_to_q15_with_offset(const q7_t *src, q15_t *dst, uint32_t block_size, q15_t offset); 153 void arm_q7_to_q15_reordered_with_offset(const q7_t *src, q15_t *dst, uint32_t block_size, q15_t of… 170 void arm_nn_accumulate_q7_to_q15(q15_t *dst, const q7_t *src, uint32_t block_size); 191 q7_t *arm_nn_depthwise_conv_s8_core(const q7_t *row, 201 q7_t *out); 225 q7_t *arm_nn_mat_mult_s8(const q7_t *input_row, [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/MatrixFunctions/ |
D | arm_mat_mult_q7.c | 65 q7_t const *pInB = (q7_t const *)pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q7_2x2_mve() 66 q7_t *pInA = pSrcA->pData; /* input data matrix pointer A */ in arm_mat_mult_q7_2x2_mve() 67 q7_t *pOut = pDst->pData; /* output data matrix pointer */ in arm_mat_mult_q7_2x2_mve() 69 q7_t *pInA0 = pInA; in arm_mat_mult_q7_2x2_mve() 70 q7_t *pInA1 = pInA0 + MATRIX_DIM; in arm_mat_mult_q7_2x2_mve() 87 pOut[0 * MATRIX_DIM] = (q7_t) __SSAT(acc0 >> 7, 8); in arm_mat_mult_q7_2x2_mve() 88 pOut[1 * MATRIX_DIM] = (q7_t) __SSAT(acc1 >> 7, 8); in arm_mat_mult_q7_2x2_mve() 99 pOut[0 * MATRIX_DIM] = (q7_t) __SSAT(acc0 >> 7, 8); in arm_mat_mult_q7_2x2_mve() 100 pOut[1 * MATRIX_DIM] = (q7_t) __SSAT(acc1 >> 7, 8); in arm_mat_mult_q7_2x2_mve() 114 q7_t const *pInB = (q7_t const *)pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q7_3x3_mve() [all …]
|
D | arm_mat_vec_mult_q7.c | 55 const q7_t *pSrcVec, in arm_mat_vec_mult_q7() 56 q7_t *pDstVec) in arm_mat_vec_mult_q7() 58 const q7_t *pMatSrc = pSrcMat->pData; in arm_mat_vec_mult_q7() 59 const q7_t *pMat0, *pMat1; in arm_mat_vec_mult_q7() 62 q7_t *px; in arm_mat_vec_mult_q7() 74 q7_t const *pMat0Vec, *pMat1Vec, *pMat2Vec, *pMat3Vec, *pVec; in arm_mat_vec_mult_q7() 75 const q7_t *pMat2, *pMat3; in arm_mat_vec_mult_q7() 76 q7_t const *pSrcVecPtr = pSrcVec; in arm_mat_vec_mult_q7() 160 q7_t const *pMat0Vec, *pMat1Vec, *pVec; in arm_mat_vec_mult_q7() 161 q7_t const *pSrcVecPtr = pSrcVec; in arm_mat_vec_mult_q7() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/NNSupportFunctions/ |
D | arm_nn_mat_mult_nt_t_s8.c | 48 arm_status arm_nn_mat_mult_nt_t_s8(const q7_t *lhs, in arm_nn_mat_mult_nt_t_s8() 49 const q7_t *rhs, in arm_nn_mat_mult_nt_t_s8() 51 q7_t *dst, in arm_nn_mat_mult_nt_t_s8() 67 const q7_t *lhs_ptr = &lhs[0]; in arm_nn_mat_mult_nt_t_s8() 68 q7_t *dst_ptr = &dst[0]; in arm_nn_mat_mult_nt_t_s8() 91 const q7_t *rhs_ptr = &rhs[0]; in arm_nn_mat_mult_nt_t_s8() 104 val1 = arm_nn_read_q7x4_ia((const q7_t **)&rhs_ptr); in arm_nn_mat_mult_nt_t_s8() 106 val0 = arm_nn_read_q7x4_ia((const q7_t **)&lhs_ptr); in arm_nn_mat_mult_nt_t_s8() 108 val4 = arm_nn_read_q7x4((const q7_t *)&rhs_ptr[off0]); in arm_nn_mat_mult_nt_t_s8() 121 val0 = arm_nn_read_q7x4((const q7_t *)&lhs_ptr[off0]); in arm_nn_mat_mult_nt_t_s8() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/FilteringFunctions/ |
D | arm_fir_q7.c | 61 const q7_t *pSmp = &pSample[j]; \ 69 *pOutput++ = (q7_t) __SSAT((acc[j] >> 7U), 8); \ 74 q7_t *pState = S->pState; /* State pointer */ \ 75 const q7_t *pCoeffs = S->pCoeffs; /* Coefficient pointer */ \ 76 q7_t *pStateCur; /* Points to the current sample of the state */ \ 77 const q7_t *pSamples; /* Temporary pointer to the sample buffer */ \ 78 q7_t *pOutput; /* Temporary pointer to the output buffer */ \ 79 const q7_t *pTempSrc; /* Temporary pointer to the source data */ \ 80 q7_t *pTempDest; /* Temporary pointer to the destination buffer */\ 145 const q7_t * __restrict pSrc, in arm_fir_q7_49_64_mve() [all …]
|
D | arm_conv_q7.c | 64 const q7_t * pSrcA, in arm_conv_q7() 66 const q7_t * pSrcB, in arm_conv_q7() 68 q7_t * pDst) in arm_conv_q7() 70 const q7_t *pIn1 = pSrcA; /* inputA pointer */ in arm_conv_q7() 71 const q7_t *pIn2 = pSrcB; /* inputB pointer */ in arm_conv_q7() 75 const q7_t *pX; in arm_conv_q7() 76 const q7_t *pY; in arm_conv_q7() 77 const q7_t *pA; in arm_conv_q7() 78 const q7_t *pB; in arm_conv_q7() 119 *pDst++ = (q7_t) acc0; in arm_conv_q7() [all …]
|
D | arm_correlate_q7.c | 64 const q7_t * pSrcA, in arm_correlate_q7() 66 const q7_t * pSrcB, in arm_correlate_q7() 68 q7_t * pDst) in arm_correlate_q7() 70 const q7_t *pIn1 = pSrcA; /* inputA pointer */ in arm_correlate_q7() 71 const q7_t *pIn2 = pSrcB + (srcBLen - 1U); /* inputB pointer */ in arm_correlate_q7() 72 const q7_t *pX, *pY; in arm_correlate_q7() 73 const q7_t *pA, *pB; in arm_correlate_q7() 141 *pDst = (q7_t) acc0; in arm_correlate_q7() 143 *pDst = (q7_t) acc1; in arm_correlate_q7() 156 *pDst = (q7_t) acc; in arm_correlate_q7() [all …]
|
D | arm_fir_sparse_q7.c | 61 const q7_t * pSrc, in arm_fir_sparse_q7() 62 q7_t * pDst, in arm_fir_sparse_q7() 63 q7_t * pScratchIn, in arm_fir_sparse_q7() 67 q7_t *pState = S->pState; /* State pointer */ in arm_fir_sparse_q7() 68 const q7_t *pCoeffs = S->pCoeffs; /* Coefficient pointer */ in arm_fir_sparse_q7() 69 q7_t *px; /* Scratch buffer pointer */ in arm_fir_sparse_q7() 70 q7_t *py = pState; /* Temporary pointers for state buffer */ in arm_fir_sparse_q7() 71 q7_t *pb = pScratchIn; /* Temporary pointers for scratch buffer */ in arm_fir_sparse_q7() 72 q7_t *pOut = pDst; /* Destination pointer */ in arm_fir_sparse_q7() 80 q7_t coeff = *pCoeffs++; /* Read the coefficient value */ in arm_fir_sparse_q7() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/BasicMathFunctions/ |
D | arm_abs_q7.c | 59 const q7_t * pSrc, in arm_abs_q7() 60 q7_t * pDst, in arm_abs_q7() 100 const q7_t * pSrc, in arm_abs_q7() 101 q7_t * pDst, in arm_abs_q7() 105 q7_t in; /* Temporary input variable */ in arm_abs_q7() 119 *pDst++ = (in > 0) ? in : (q7_t)__QSUB8(0, in); in arm_abs_q7() 121 *pDst++ = (in > 0) ? in : ((in == (q7_t) 0x80) ? (q7_t) 0x7f : -in); in arm_abs_q7() 126 *pDst++ = (in > 0) ? in : (q7_t)__QSUB8(0, in); in arm_abs_q7() 128 *pDst++ = (in > 0) ? in : ((in == (q7_t) 0x80) ? (q7_t) 0x7f : -in); in arm_abs_q7() 133 *pDst++ = (in > 0) ? in : (q7_t)__QSUB8(0, in); in arm_abs_q7() [all …]
|
D | arm_negate_q7.c | 56 const q7_t * pSrc, in arm_negate_q7() 57 q7_t * pDst, in arm_negate_q7() 97 const q7_t * pSrc, in arm_negate_q7() 98 q7_t * pDst, in arm_negate_q7() 102 q7_t in; /* Temporary input variable */ in arm_negate_q7() 119 in1 = read_q7x4_ia ((q7_t **) &pSrc); in arm_negate_q7() 123 *pDst++ = (in == (q7_t) 0x80) ? (q7_t) 0x7f : -in; in arm_negate_q7() 126 *pDst++ = (in == (q7_t) 0x80) ? (q7_t) 0x7f : -in; in arm_negate_q7() 129 *pDst++ = (in == (q7_t) 0x80) ? (q7_t) 0x7f : -in; in arm_negate_q7() 132 *pDst++ = (in == (q7_t) 0x80) ? (q7_t) 0x7f : -in; in arm_negate_q7() [all …]
|
D | arm_scale_q7.c | 60 const q7_t * pSrc, in arm_scale_q7() 61 q7_t scaleFract, in arm_scale_q7() 63 q7_t * pDst, in arm_scale_q7() 111 const q7_t * pSrc, in arm_scale_q7() 112 q7_t scaleFract, in arm_scale_q7() 114 q7_t * pDst, in arm_scale_q7() 123 q7_t in1, in2, in3, in4; /* Temporary input variables */ in arm_scale_q7() 124 q7_t out1, out2, out3, out4; /* Temporary output variables */ in arm_scale_q7() 142 out1 = (q7_t) (__SSAT(((in1) * scaleFract) >> kShift, 8)); in arm_scale_q7() 143 out2 = (q7_t) (__SSAT(((in2) * scaleFract) >> kShift, 8)); in arm_scale_q7() [all …]
|
D | arm_mult_q7.c | 57 const q7_t * pSrcA, in arm_mult_q7() 58 const q7_t * pSrcB, in arm_mult_q7() 59 q7_t * pDst, in arm_mult_q7() 102 const q7_t * pSrcA, in arm_mult_q7() 103 const q7_t * pSrcB, in arm_mult_q7() 104 q7_t * pDst, in arm_mult_q7() 112 q7_t out1, out2, out3, out4; /* Temporary output variables */ in arm_mult_q7() 124 out1 = (q7_t) __SSAT((((q15_t) (*pSrcA++) * (*pSrcB++)) >> 7), 8); in arm_mult_q7() 125 out2 = (q7_t) __SSAT((((q15_t) (*pSrcA++) * (*pSrcB++)) >> 7), 8); in arm_mult_q7() 126 out3 = (q7_t) __SSAT((((q15_t) (*pSrcA++) * (*pSrcB++)) >> 7), 8); in arm_mult_q7() [all …]
|
D | arm_sub_q7.c | 57 const q7_t * pSrcA, in arm_sub_q7() 58 const q7_t * pSrcB, in arm_sub_q7() 59 q7_t * pDst, in arm_sub_q7() 102 const q7_t * pSrcA, in arm_sub_q7() 103 const q7_t * pSrcB, in arm_sub_q7() 104 q7_t * pDst, in arm_sub_q7() 120 … write_q7x4_ia (&pDst, __QSUB8(read_q7x4_ia ((q7_t **) &pSrcA), read_q7x4_ia ((q7_t **) &pSrcB))); in arm_sub_q7() 122 *pDst++ = (q7_t) __SSAT((q15_t) *pSrcA++ - *pSrcB++, 8); in arm_sub_q7() 123 *pDst++ = (q7_t) __SSAT((q15_t) *pSrcA++ - *pSrcB++, 8); in arm_sub_q7() 124 *pDst++ = (q7_t) __SSAT((q15_t) *pSrcA++ - *pSrcB++, 8); in arm_sub_q7() [all …]
|
D | arm_add_q7.c | 59 const q7_t * pSrcA, in arm_add_q7() 60 const q7_t * pSrcB, in arm_add_q7() 61 q7_t * pDst, in arm_add_q7() 104 const q7_t * pSrcA, in arm_add_q7() 105 const q7_t * pSrcB, in arm_add_q7() 106 q7_t * pDst, in arm_add_q7() 122 … write_q7x4_ia (&pDst, __QADD8 (read_q7x4_ia ((q7_t **) &pSrcA), read_q7x4_ia ((q7_t **) &pSrcB))); in arm_add_q7() 124 *pDst++ = (q7_t) __SSAT ((q15_t) *pSrcA++ + *pSrcB++, 8); in arm_add_q7() 125 *pDst++ = (q7_t) __SSAT ((q15_t) *pSrcA++ + *pSrcB++, 8); in arm_add_q7() 126 *pDst++ = (q7_t) __SSAT ((q15_t) *pSrcA++ + *pSrcB++, 8); in arm_add_q7() [all …]
|
D | arm_offset_q7.c | 57 const q7_t * pSrc, in arm_offset_q7() 58 q7_t offset, in arm_offset_q7() 59 q7_t * pDst, in arm_offset_q7() 99 const q7_t * pSrc, in arm_offset_q7() 100 q7_t offset, in arm_offset_q7() 101 q7_t * pDst, in arm_offset_q7() 124 write_q7x4_ia (&pDst, __QADD8(read_q7x4_ia ((q7_t **) &pSrc), offset_packed)); in arm_offset_q7() 126 *pDst++ = (q7_t) __SSAT((q15_t) *pSrc++ + offset, 8); in arm_offset_q7() 127 *pDst++ = (q7_t) __SSAT((q15_t) *pSrc++ + offset, 8); in arm_offset_q7() 128 *pDst++ = (q7_t) __SSAT((q15_t) *pSrc++ + offset, 8); in arm_offset_q7() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/FullyConnectedFunctions/ |
D | arm_fully_connected_q7_opt.c | 128 arm_status arm_fully_connected_q7_opt(const q7_t *pV, in arm_fully_connected_q7_opt() 129 const q7_t *pM, in arm_fully_connected_q7_opt() 134 const q7_t *bias, in arm_fully_connected_q7_opt() 135 q7_t *pOut, in arm_fully_connected_q7_opt() 142 const q7_t *pB = pM; in arm_fully_connected_q7_opt() 143 q7_t *pO = pOut; in arm_fully_connected_q7_opt() 144 const q7_t *pBias = bias; in arm_fully_connected_q7_opt() 323 q7_t inM = *pB++; in arm_fully_connected_q7_opt() 324 q7_t inM2 = *pB++; in arm_fully_connected_q7_opt() 325 q7_t inM3 = *pB++; in arm_fully_connected_q7_opt() [all …]
|
D | arm_fully_connected_q7.c | 67 arm_status arm_fully_connected_q7(const q7_t *pV, in arm_fully_connected_q7() 68 const q7_t *pM, in arm_fully_connected_q7() 73 const q7_t *bias, in arm_fully_connected_q7() 74 q7_t *pOut, in arm_fully_connected_q7() 81 const q7_t *pB = pM; in arm_fully_connected_q7() 82 const q7_t *pB2; in arm_fully_connected_q7() 83 q7_t *pO = pOut; in arm_fully_connected_q7() 84 const q7_t *pBias = bias; in arm_fully_connected_q7() 121 q7_t inV = *pA++; in arm_fully_connected_q7() 129 *pO++ = (q7_t)(__SSAT((sum >> out_shift), 8)); in arm_fully_connected_q7() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/StatisticsFunctions/ |
D | arm_absmin_q7.c | 57 const q7_t *pSrc, in arm_small_blk_absmin_q7() 59 q7_t *pResult, in arm_small_blk_absmin_q7() 64 q7_t const *pSrcVec; in arm_small_blk_absmin_q7() 66 q7_t minValue = Q7_ABSMAX; in arm_small_blk_absmin_q7() 77 pSrcVec = (q7_t const *) pSrc; in arm_small_blk_absmin_q7() 136 const q7_t * pSrc, in arm_absmin_q7() 138 q7_t * pResult, in arm_absmin_q7() 150 q7_t curBlkExtr = Q7_MAX; in arm_absmin_q7() 158 const q7_t *curSrc = pSrc; in arm_absmin_q7() 192 const q7_t * pSrc, in arm_absmin_q7() [all …]
|
D | arm_absmax_q7.c | 57 const q7_t * pSrc, in arm_small_blk_absmax_q7() 59 q7_t * pResult, in arm_small_blk_absmax_q7() 64 q7_t maxValue = Q7_ABSMIN; in arm_small_blk_absmax_q7() 108 const q7_t * pSrc, in arm_absmax_q7() 110 q7_t * pResult, in arm_absmax_q7() 122 q7_t curBlkExtr = Q7_MIN; in arm_absmax_q7() 130 const q7_t *curSrc = pSrc; in arm_absmax_q7() 163 const q7_t * pSrc, in arm_absmax_q7() 165 q7_t * pResult, in arm_absmax_q7() 168 … q7_t cur_absmax, out; /* Temporary variables to store the output value. */\ in arm_absmax_q7() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Include/dsp/ |
D | basic_math_functions.h | 54 const q7_t * pSrcA, 55 const q7_t * pSrcB, 56 q7_t * pDst, 126 const q7_t * pSrcA, 127 const q7_t * pSrcB, 128 q7_t * pDst, 183 const q7_t * pSrcA, 184 const q7_t * pSrcB, 185 q7_t * pDst, 241 const q7_t * pSrc, [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/PoolingFunctions/ |
D | arm_pool_q7_HWC.c | 42 static void buffer_scale_back_q15_to_q7(q15_t *buffer, q7_t *target, uint16_t length, uint16_t scal… in buffer_scale_back_q15_to_q7() 48 target[i] = (q7_t)(buffer[i] / scale); in buffer_scale_back_q15_to_q7() 52 static void compare_and_replace_if_larger_q7(q7_t *base, // base data in compare_and_replace_if_larger_q7() 53 const q7_t *target, // compare target in compare_and_replace_if_larger_q7() 57 q7_t *pIn = base; in compare_and_replace_if_larger_q7() 58 const q7_t *pCom = target; in compare_and_replace_if_larger_q7() 65 in.word = arm_nn_read_q7x4((const q7_t *)pIn); in compare_and_replace_if_larger_q7() 66 com.word = arm_nn_read_q7x4_ia((const q7_t **)&pCom); in compare_and_replace_if_larger_q7() 96 static void accumulate_q7_to_q15(q15_t *base, q7_t *target, const uint16_t length) in accumulate_q7_to_q15() 99 q7_t *pV = target; in accumulate_q7_to_q15() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/ConvolutionFunctions/ |
D | arm_nn_mat_mult_kernel_q7_q15.c | 40 q7_t *arm_nn_mat_mult_kernel_q7_q15(const q7_t *pA, in arm_nn_mat_mult_kernel_q7_q15() 46 const q7_t *bias, in arm_nn_mat_mult_kernel_q7_q15() 47 q7_t *pOut) in arm_nn_mat_mult_kernel_q7_q15() 51 q7_t *pOut2 = pOut + ch_im_out; in arm_nn_mat_mult_kernel_q7_q15() 52 const q7_t *pBias = bias; in arm_nn_mat_mult_kernel_q7_q15() 63 const q7_t *pA2 = pA + numCol_A; in arm_nn_mat_mult_kernel_q7_q15() 101 q7_t inA1 = *pA++; in arm_nn_mat_mult_kernel_q7_q15() 103 q7_t inA2 = *pA2++; in arm_nn_mat_mult_kernel_q7_q15() 112 *pOut++ = (q7_t)__SSAT((sum >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15() 113 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15() [all …]
|
D | arm_depthwise_separable_conv_HWC_q7.c | 82 arm_status arm_depthwise_separable_conv_HWC_q7(const q7_t *Im_in, in arm_depthwise_separable_conv_HWC_q7() 85 const q7_t *wt, in arm_depthwise_separable_conv_HWC_q7() 90 const q7_t *bias, in arm_depthwise_separable_conv_HWC_q7() 93 q7_t *Im_out, in arm_depthwise_separable_conv_HWC_q7() 96 q7_t *bufferB) in arm_depthwise_separable_conv_HWC_q7() 104 q7_t *colBuffer = (q7_t *)bufferA; in arm_depthwise_separable_conv_HWC_q7() 105 q7_t *pBuffer = colBuffer; in arm_depthwise_separable_conv_HWC_q7() 106 const q7_t *pBias = bias; in arm_depthwise_separable_conv_HWC_q7() 107 q7_t *pOut = Im_out; in arm_depthwise_separable_conv_HWC_q7() 135 … memcpy(pBuffer, (q7_t *)Im_in + (i_ker_y * dim_im_in + i_ker_x) * ch_im_in, ch_im_in); in arm_depthwise_separable_conv_HWC_q7() [all …]
|
D | arm_depthwise_separable_conv_HWC_q7_nonsquare.c | 74 arm_status arm_depthwise_separable_conv_HWC_q7_nonsquare(const q7_t *Im_in, in arm_depthwise_separable_conv_HWC_q7_nonsquare() 78 const q7_t *wt, in arm_depthwise_separable_conv_HWC_q7_nonsquare() 86 const q7_t *bias, in arm_depthwise_separable_conv_HWC_q7_nonsquare() 89 q7_t *Im_out, in arm_depthwise_separable_conv_HWC_q7_nonsquare() 93 q7_t *bufferB) in arm_depthwise_separable_conv_HWC_q7_nonsquare() 112 q7_t *colBuffer = (q7_t *)bufferA; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 113 q7_t *pBuffer = colBuffer; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 114 const q7_t *pBias = bias; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 115 q7_t *pOut = Im_out; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 145 … memcpy(pBuffer, (q7_t *)Im_in + (i_ker_y * dim_im_in_x + i_ker_x) * ch_im_in, ch_im_in); in arm_depthwise_separable_conv_HWC_q7_nonsquare() [all …]
|