/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/FullyConnectedFunctions/ |
D | arm_fully_connected_q7_opt.c | 142 const q7_t *pB = pM; in arm_fully_connected_q7_opt() local 171 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 176 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 183 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 188 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 202 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 207 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 214 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 219 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_q7_opt() 273 [ pB ] "+r"(pB), in arm_fully_connected_q7_opt() [all …]
|
D | arm_fully_connected_q15_opt.c | 110 const q15_t *pB = pM; in arm_fully_connected_q15_opt() local 136 inM11 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15_opt() 138 inM12 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15_opt() 140 inM13 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15_opt() 142 inM14 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15_opt() 174 [ pB ] "+r"(pB), in arm_fully_connected_q15_opt() 186 q15_t inM = *pB++; in arm_fully_connected_q15_opt() 187 q15_t inM2 = *pB++; in arm_fully_connected_q15_opt() 188 q15_t inM3 = *pB++; in arm_fully_connected_q15_opt() 189 q15_t inM4 = *pB++; in arm_fully_connected_q15_opt() [all …]
|
D | arm_fully_connected_mat_q7_vec_q15_opt.c | 131 const q7_t *pB = pM; in arm_fully_connected_mat_q7_vec_q15_opt() local 159 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_mat_q7_vec_q15_opt() 164 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_mat_q7_vec_q15_opt() 180 inM11 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_mat_q7_vec_q15_opt() 185 inM13 = arm_nn_read_q7x4_ia(&pB); in arm_fully_connected_mat_q7_vec_q15_opt() 227 [ pB ] "+r"(pB), in arm_fully_connected_mat_q7_vec_q15_opt() 252 [ pB ] "+r"(pB), in arm_fully_connected_mat_q7_vec_q15_opt() 264 q7_t inM = *pB++; in arm_fully_connected_mat_q7_vec_q15_opt() 265 q7_t inM2 = *pB++; in arm_fully_connected_mat_q7_vec_q15_opt() 266 q7_t inM3 = *pB++; in arm_fully_connected_mat_q7_vec_q15_opt() [all …]
|
D | arm_fully_connected_q15.c | 79 const q15_t *pB = pM; in arm_fully_connected_q15() local 80 const q15_t *pB2 = pB + dim_vec; in arm_fully_connected_q15() 95 pB2 = pB + dim_vec; in arm_fully_connected_q15() 101 inM1 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15() 107 inM1 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15() 118 q15_t inM = *pB++; in arm_fully_connected_q15() 129 pB = pB + dim_vec; in arm_fully_connected_q15() 147 inM1 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15() 151 inM1 = arm_nn_read_q15x2_ia(&pB); in arm_fully_connected_q15() 162 q15_t inM = *pB++; in arm_fully_connected_q15()
|
D | arm_fully_connected_mat_q7_vec_q15.c | 82 const q7_t *pB = pM; in arm_fully_connected_mat_q7_vec_q15() local 97 pB2 = pB + dim_vec; in arm_fully_connected_mat_q7_vec_q15() 102 pB = read_and_pad(pB, &inM11, &inM12); in arm_fully_connected_mat_q7_vec_q15() 121 q7_t inM = *pB++; in arm_fully_connected_mat_q7_vec_q15() 132 pB += dim_vec; in arm_fully_connected_mat_q7_vec_q15() 150 pB = read_and_pad(pB, &inM11, &inM12); in arm_fully_connected_mat_q7_vec_q15() 166 q7_t inM = *pB++; in arm_fully_connected_mat_q7_vec_q15()
|
D | arm_fully_connected_q7.c | 81 const q7_t *pB = pM; in arm_fully_connected_q7() local 98 pB2 = pB + dim_vec; in arm_fully_connected_q7() 103 pB = read_and_pad_reordered(pB, &inM11, &inM12); in arm_fully_connected_q7() 122 q15_t inM = *pB++; in arm_fully_connected_q7() 133 pB += dim_vec; in arm_fully_connected_q7() 151 pB = read_and_pad_reordered(pB, &inM11, &inM12); in arm_fully_connected_q7() 167 q15_t inM = *pB++; in arm_fully_connected_q7()
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Include/dsp/ |
D | distance_functions.h | 70 float32_t arm_euclidean_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 80 float32_t arm_braycurtis_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 95 float32_t arm_canberra_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 106 float32_t arm_chebyshev_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 117 float32_t arm_cityblock_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 130 float32_t arm_correlation_distance_f32(float32_t *pA,float32_t *pB, uint32_t blockSize); 142 float32_t arm_cosine_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize); 164 float32_t arm_jensenshannon_distance_f32(const float32_t *pA,const float32_t *pB,uint32_t blockSize… 179 float32_t arm_minkowski_distance_f32(const float32_t *pA,const float32_t *pB, int32_t order, uint32… 193 float32_t arm_dice_distance(const uint32_t *pA, const uint32_t *pB, uint32_t numberOfBools); [all …]
|
D | distance_functions_f16.h | 63 float16_t arm_euclidean_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 73 float16_t arm_braycurtis_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 88 float16_t arm_canberra_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 99 float16_t arm_chebyshev_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 110 float16_t arm_cityblock_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 123 float16_t arm_correlation_distance_f16(float16_t *pA,float16_t *pB, uint32_t blockSize); 135 float16_t arm_cosine_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize); 157 float16_t arm_jensenshannon_distance_f16(const float16_t *pA,const float16_t *pB,uint32_t blockSize… 172 float16_t arm_minkowski_distance_f16(const float16_t *pA,const float16_t *pB, int32_t order, uint32…
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/TransformFunctions/ |
D | arm_rfft_fast_f16.c | 46 float16_t *pB = p; /* decreasing pointer */ in stage_rfft_f16() local 66 xBR = pB[0]; in stage_rfft_f16() 67 xBI = pB[1]; in stage_rfft_f16() 86 pB = p + 2*k - 14; in stage_rfft_f16() 111 xB = vld2q_f16(pB); in stage_rfft_f16() 113 xB.val[0] = vldrhq_gather_shifted_offset_f16(pB, vecStridesBkwd); in stage_rfft_f16() 114 xB.val[1] = vldrhq_gather_shifted_offset_f16(&pB[1], vecStridesBkwd); in stage_rfft_f16() 117 pB -= 16; in stage_rfft_f16() 150 pB += 14; in stage_rfft_f16() 169 xBI = pB[1]; in stage_rfft_f16() [all …]
|
D | arm_rfft_fast_f32.c | 41 float32_t *pB = p; /* decreasing pointer */ in stage_rfft_f32() local 61 xBR = pB[0]; in stage_rfft_f32() 62 xBI = pB[1]; in stage_rfft_f32() 81 pB = p + 2*k; in stage_rfft_f32() 106 xB = vld2q_f32(pB); in stage_rfft_f32() 108 xB.val[0] = vldrwq_gather_shifted_offset_f32(pB, vecStridesBkwd); in stage_rfft_f32() 109 xB.val[1] = vldrwq_gather_shifted_offset_f32(&pB[1], vecStridesBkwd); in stage_rfft_f32() 112 pB -= 8; in stage_rfft_f32() 163 xBI = pB[1]; in stage_rfft_f32() 164 xBR = pB[0]; in stage_rfft_f32() [all …]
|
D | arm_rfft_fast_f64.c | 40 float64_t *pB = p; /* decreasing pointer */ in stage_rfft_f64() local 50 xBR = pB[0]; in stage_rfft_f64() 51 xBI = pB[1]; in stage_rfft_f64() 70 pB = p + 2*k; in stage_rfft_f64() 90 xBI = pB[1]; in stage_rfft_f64() 91 xBR = pB[0]; in stage_rfft_f64() 112 pB -= 2; in stage_rfft_f64() 127 float64_t *pB = p; /* decreasing pointer */ in merge_rfft_f64() local 141 pB = p + 2*k ; in merge_rfft_f64() 149 xBI = pB[1] ; in merge_rfft_f64() [all …]
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/DistanceFunctions/ |
D | arm_chebyshev_distance_f32.c | 55 float32_t arm_chebyshev_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_chebyshev_distance_f32() argument 67 vecB = vld1q(pB); in arm_chebyshev_distance_f32() 68 pB += 4; in arm_chebyshev_distance_f32() 87 vecB = vldrwq_z_f32(pB, p0); in arm_chebyshev_distance_f32() 106 float32_t arm_chebyshev_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_chebyshev_distance_f32() argument 116 tmpB = *pB++; in arm_chebyshev_distance_f32() 124 tmpB = *pB++; in arm_chebyshev_distance_f32() 137 b = vld1q_f32(pB); in arm_chebyshev_distance_f32() 139 pB += 4; in arm_chebyshev_distance_f32() 152 b = vld1q_f32(pB); in arm_chebyshev_distance_f32() [all …]
|
D | arm_cityblock_distance_f32.c | 53 float32_t arm_cityblock_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_cityblock_distance_f32() argument 63 b = vld1q(pB); in arm_cityblock_distance_f32() 69 pB += 4; in arm_cityblock_distance_f32() 82 b = vldrwq_z_f32(pB, p0); in arm_cityblock_distance_f32() 96 float32_t arm_cityblock_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_cityblock_distance_f32() argument 109 b = vld1q_f32(pB); in arm_cityblock_distance_f32() 115 pB += 4; in arm_cityblock_distance_f32() 127 tmpB = *pB++; in arm_cityblock_distance_f32() 136 float32_t arm_cityblock_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_cityblock_distance_f32() argument 144 tmpB = *pB++; in arm_cityblock_distance_f32()
|
D | arm_euclidean_distance_f32.c | 54 float32_t arm_euclidean_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_euclidean_distance_f32() argument 65 b = vld1q(pB); in arm_euclidean_distance_f32() 71 pB += 4; in arm_euclidean_distance_f32() 84 b = vldrwq_z_f32(pB, p0); in arm_euclidean_distance_f32() 98 float32_t arm_euclidean_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_euclidean_distance_f32() argument 110 b = vld1q_f32(pB); in arm_euclidean_distance_f32() 115 pB += 4; in arm_euclidean_distance_f32() 124 tmp = *pA++ - *pB++; in arm_euclidean_distance_f32() 133 float32_t arm_euclidean_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_euclidean_distance_f32() argument 139 tmp = *pA++ - *pB++; in arm_euclidean_distance_f32()
|
D | arm_braycurtis_distance_f32.c | 54 float32_t arm_braycurtis_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_braycurtis_distance_f32() argument 67 b = vld1q(pB); in arm_braycurtis_distance_f32() 77 pB += 4; in arm_braycurtis_distance_f32() 86 b = vldrwq_z_f32(pB, p0); in arm_braycurtis_distance_f32() 110 float32_t arm_braycurtis_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_braycurtis_distance_f32() argument 124 b = vld1q_f32(pB); in arm_braycurtis_distance_f32() 134 pB += 4; in arm_braycurtis_distance_f32() 146 accumDiff += fabsf(*pA - *pB); in arm_braycurtis_distance_f32() 147 accumSum += fabsf(*pA++ + *pB++); in arm_braycurtis_distance_f32() 160 float32_t arm_braycurtis_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_braycurtis_distance_f32() argument [all …]
|
D | arm_jensenshannon_distance_f32.c | 54 float32_t arm_jensenshannon_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSiz… in arm_jensenshannon_distance_f32() argument 65 b = vld1q(pB); in arm_jensenshannon_distance_f32() 79 pB += 4; in arm_jensenshannon_distance_f32() 92 b = vldrwq_z_f32(pB, p0); in arm_jensenshannon_distance_f32() 139 float32_t arm_jensenshannon_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSiz… in arm_jensenshannon_distance_f32() argument 153 bV = vld1q_f32(pB); in arm_jensenshannon_distance_f32() 167 pB += 4; in arm_jensenshannon_distance_f32() 180 b = *pB; in arm_jensenshannon_distance_f32() 186 pB++; in arm_jensenshannon_distance_f32() 221 float32_t arm_jensenshannon_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSiz… in arm_jensenshannon_distance_f32() argument [all …]
|
D | arm_minkowski_distance_f32.c | 76 float32_t arm_minkowski_distance_f32(const float32_t *pA,const float32_t *pB, int32_t order, uint32… in arm_minkowski_distance_f32() argument 86 b = vld1q(pB); in arm_minkowski_distance_f32() 93 pB += 4; in arm_minkowski_distance_f32() 106 b = vldrwq_z_f32(pB, p0); in arm_minkowski_distance_f32() 121 float32_t arm_minkowski_distance_f32(const float32_t *pA,const float32_t *pB, int32_t order, uint32… in arm_minkowski_distance_f32() argument 136 bV = vld1q_f32(pB); in arm_minkowski_distance_f32() 138 pB += 4; in arm_minkowski_distance_f32() 154 sum += powf(fabsf(*pA++ - *pB++),order); in arm_minkowski_distance_f32() 167 float32_t arm_minkowski_distance_f32(const float32_t *pA,const float32_t *pB, int32_t order, uint32… in arm_minkowski_distance_f32() argument 175 sum += powf(fabsf(pA[i] - pB[i]),order); in arm_minkowski_distance_f32()
|
D | arm_canberra_distance_f32.c | 60 float32_t arm_canberra_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_canberra_distance_f32() argument 71 b = vld1q(pB); in arm_canberra_distance_f32() 93 pB += 4; in arm_canberra_distance_f32() 102 b = vldrwq_z_f32(pB, p0); in arm_canberra_distance_f32() 134 float32_t arm_canberra_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_canberra_distance_f32() argument 149 b = vld1q_f32(pB); in arm_canberra_distance_f32() 172 pB += 4; in arm_canberra_distance_f32() 183 tmpB = *pB++; in arm_canberra_distance_f32() 197 float32_t arm_canberra_distance_f32(const float32_t *pA,const float32_t *pB, uint32_t blockSize) in arm_canberra_distance_f32() argument 204 tmpB = *pB++; in arm_canberra_distance_f32()
|
D | arm_chebyshev_distance_f16.c | 67 float16_t arm_chebyshev_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize) in arm_chebyshev_distance_f16() argument 79 vecB = vld1q(pB); in arm_chebyshev_distance_f16() 80 pB += 8; in arm_chebyshev_distance_f16() 99 vecB = vldrhq_z_f16(pB, p0); in arm_chebyshev_distance_f16() 114 float16_t arm_chebyshev_distance_f16(const float16_t *pA,const float16_t *pB, uint32_t blockSize) in arm_chebyshev_distance_f16() argument 119 tmpB = *pB++; in arm_chebyshev_distance_f16() 127 tmpB = *pB++; in arm_chebyshev_distance_f16()
|
D | arm_correlation_distance_f16.c | 66 float16_t arm_correlation_distance_f16(float16_t *pA,float16_t *pB, uint32_t blockSize) in arm_correlation_distance_f16() argument 71 arm_mean_f16(pB, blockSize, &mb); in arm_correlation_distance_f16() 74 arm_offset_f16(pB, -mb, pB, blockSize); in arm_correlation_distance_f16() 77 arm_power_f16(pB, blockSize, &pwrb); in arm_correlation_distance_f16() 79 arm_dot_prod_f16(pA,pB,blockSize,&dot); in arm_correlation_distance_f16()
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/NN/Source/ConvolutionFunctions/ |
D | arm_depthwise_separable_conv_HWC_q7.c | 154 q7_t *pB = colBuffer + row_shift; in arm_depthwise_separable_conv_HWC_q7() local 166 inB1 = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7() 167 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7() 168 opB = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7() 169 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7() 198 inB1 = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7() 199 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7() 200 opB = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7() 201 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7() 270 [ pB ] "+r"(pB), in arm_depthwise_separable_conv_HWC_q7() [all …]
|
D | arm_depthwise_separable_conv_HWC_q7_nonsquare.c | 164 q7_t *pB = colBuffer + row_shift; in arm_depthwise_separable_conv_HWC_q7_nonsquare() local 176 inB1 = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 177 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 178 opB = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 179 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 208 inB1 = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 209 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 210 opB = arm_nn_read_q7x4(pB); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 211 pB += ch_im_in; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 277 [ pB ] "+r"(pB), in arm_depthwise_separable_conv_HWC_q7_nonsquare() [all …]
|
D | arm_nn_mat_mult_kernel_q7_q15.c | 59 const q15_t *pB = pInBuffer; in arm_nn_mat_mult_kernel_q7_q15() local 60 const q15_t *pB2 = pB + numCol_A; in arm_nn_mat_mult_kernel_q7_q15() 77 q31_t inB1 = arm_nn_read_q15x2_ia(&pB); in arm_nn_mat_mult_kernel_q7_q15() 88 inB1 = arm_nn_read_q15x2_ia(&pB); in arm_nn_mat_mult_kernel_q7_q15() 102 q15_t inB1 = *pB++; in arm_nn_mat_mult_kernel_q7_q15() 126 const q15_t *pB = pInBuffer; in arm_nn_mat_mult_kernel_q7_q15() local 127 const q15_t *pB2 = pB + numCol_A; in arm_nn_mat_mult_kernel_q7_q15() 138 q31_t inB1 = arm_nn_read_q15x2_ia(&pB); in arm_nn_mat_mult_kernel_q7_q15() 146 inB1 = arm_nn_read_q15x2_ia(&pB); in arm_nn_mat_mult_kernel_q7_q15() 158 q15_t inB1 = *pB++; in arm_nn_mat_mult_kernel_q7_q15()
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/StatisticsFunctions/ |
D | arm_kullback_leibler_f32.c | 63 float32_t accum, pA,pB; in arm_kullback_leibler_f32() local 96 pB = *pSrcB++; in arm_kullback_leibler_f32() 97 accum += pA * logf(pB / pA); in arm_kullback_leibler_f32() 115 float32_t accum, pA,pB; in arm_kullback_leibler_f32() local 153 pB = *pInB++; in arm_kullback_leibler_f32() 154 accum += pA * logf(pB/pA); in arm_kullback_leibler_f32() 168 float32_t accum, pA,pB; in arm_kullback_leibler_f32() local 179 pB = *pInB++; in arm_kullback_leibler_f32() 180 accum += pA * logf(pB / pA); in arm_kullback_leibler_f32()
|
/hal_nxp-3.5.0/mcux/mcux-sdk/CMSIS/DSP/Source/SupportFunctions/ |
D | arm_merge_sort_f32.c | 33 …wnMerge(float32_t * pA, uint32_t begin, uint32_t middle, uint32_t end, float32_t * pB, uint8_t dir) in topDownMerge() argument 50 pB[k] = pA[i]; in topDownMerge() 55 pB[k] = pA[j]; in topDownMerge() 61 static void arm_merge_sort_core_f32(float32_t * pB, uint32_t begin, uint32_t end, float32_t * pA, u… in arm_merge_sort_core_f32() argument 67 arm_merge_sort_core_f32(pA, begin, middle, pB, dir); // Sort the left part in arm_merge_sort_core_f32() 68 arm_merge_sort_core_f32(pA, middle, end, pB, dir); // Sort the right part in arm_merge_sort_core_f32() 70 topDownMerge(pB, begin, middle, end, pA, dir); in arm_merge_sort_core_f32()
|