/cmsis-dsp-latest/Source/MatrixFunctions/ |
D | arm_mat_mult_fast_q31.c | 76 q31_t sum1, sum2, sum3, sum4; /* Accumulator */ in arm_mat_mult_fast_q31() local 125 sum3 = 0; in arm_mat_mult_fast_q31() 149 sum3 = __SMMLA(inA2, inB1, sum3); in arm_mat_mult_fast_q31() 154 sum3 = (q31_t) ((((q63_t) sum3 << 32) + ((q63_t) inA2 * inB1)) >> 32); in arm_mat_mult_fast_q31() 165 *px2++ = sum3 << 1; in arm_mat_mult_fast_q31()
|
D | arm_mat_mult_fast_q15.c | 88 q31_t sum2, sum3, sum4; in arm_mat_mult_fast_q15() local 255 sum3 = 0; in arm_mat_mult_fast_q15() 283 sum3 = __SMLAD(inA2, inB1, sum3); in arm_mat_mult_fast_q15() 318 sum3 += inA2 * inB1; in arm_mat_mult_fast_q15() 339 *px2++ = (q15_t) (sum3 >> 15); in arm_mat_mult_fast_q15()
|
D | arm_mat_vec_mult_q7.c | 307 q31_t sum3 = 0; in arm_mat_vec_mult_q7() local 345 sum3 = __SMLAD(matData, vecData, sum3); in arm_mat_vec_mult_q7() 346 sum3 = __SMLAD(matData2, vecData2, sum3); in arm_mat_vec_mult_q7() 365 sum3 += *pInA3++ * vecData; in arm_mat_vec_mult_q7() 373 *px++ = (q7_t)(__SSAT((sum3 >> 7), 8)); in arm_mat_vec_mult_q7()
|
D | arm_mat_cholesky_f64.c | 97 float64_t sum0=0.0,sum1=0.0,sum2=0.0,sum3=0.0; in arm_mat_cholesky_f64() local 142 sum3 = vaddvq_f64(acc3); in arm_mat_cholesky_f64() 152 sum3 = sum3 + pG[i * n + k] * pG[(j + 3) * n + k]; in arm_mat_cholesky_f64() 160 pG[(j + 3) * n + i] -= sum3; in arm_mat_cholesky_f64()
|
D | arm_mat_vec_mult_q15.c | 295 q63_t sum3 = 0; in arm_mat_vec_mult_q15() local 322 sum3 = __SMLALD(matData, vecData, sum3); in arm_mat_vec_mult_q15() 336 sum3 += (q63_t)*pInA3++ * vecData; in arm_mat_vec_mult_q15() 343 *px++ = (q15_t)(__SSAT((sum3 >> 15), 16)); in arm_mat_vec_mult_q15()
|
D | arm_mat_cholesky_f32.c | 230 float32_t sum0=0.0f,sum1=0.0f,sum2=0.0f,sum3=0.0f; in arm_mat_cholesky_f32() local 275 sum3 = vpadds_f32(vpadd_f32(vget_low_f32(acc3), vget_high_f32(acc3))); in arm_mat_cholesky_f32() 288 sum3 = vget_lane_f32(tmp, 0) + vget_lane_f32(tmp, 1); in arm_mat_cholesky_f32() 298 sum3 = sum3 + pG[i * n + k] * pG[(j + 3) * n + k]; in arm_mat_cholesky_f32() 306 pG[(j + 3) * n + i] -= sum3; in arm_mat_cholesky_f32()
|
D | arm_mat_mult_f64.c | 100 float64_t sum0,sum1, sum2,sum3, sum4, sum5 , sum6, sum7; in arm_mat_mult_f64() local 146 sum3 = 0.0; in arm_mat_mult_f64() 218 sum3 += vaddvq_f64(acc3); in arm_mat_mult_f64() 234 sum3 += *pIn1D++ * (*pIn2); in arm_mat_mult_f64() 249 *pxD++ = sum3; in arm_mat_mult_f64()
|
D | arm_mat_vec_mult_f32.c | 317 float32_t sum3 = 0.0f; in arm_mat_vec_mult_f32() local 344 sum3 += matData * vecData; in arm_mat_vec_mult_f32() 355 *px++ = sum3; in arm_mat_vec_mult_f32()
|
D | arm_mat_vec_mult_q31.c | 292 q63_t sum3 = 0; in arm_mat_vec_mult_q31() local 320 sum3 += (q63_t)matData * vecData; in arm_mat_vec_mult_q31() 331 *px++ = (q31_t)(sum3 >> 31); in arm_mat_vec_mult_q31()
|
D | arm_mat_vec_mult_f16.c | 316 float16_t sum3 = 0.0f16; in arm_mat_vec_mult_f16() local 339 sum3 += (_Float16)matData * (_Float16)vecData; in arm_mat_vec_mult_f16() 350 *px++ = sum3; in arm_mat_vec_mult_f16()
|
D | arm_mat_mult_f32.c | 579 float32_t sum0,sum1, sum2,sum3, sum4, sum5 , sum6, sum7; in arm_mat_mult_f32() local 625 sum3 = 0.0f; in arm_mat_mult_f32() 707 sum3 += vget_lane_f32(accum, 0) + vget_lane_f32(accum, 1); in arm_mat_mult_f32() 731 sum3 += *pIn1D++ * (*pIn2); in arm_mat_mult_f32() 746 *pxD++ = sum3; in arm_mat_mult_f32()
|
/cmsis-dsp-latest/dsppp/Include/dsppp/Scalar/ |
D | matrix_multiply.hpp | 77 Acc sum3 = Acc{}; in _dot_m_v() 102 sum3 = inner::mac(sum3, matData, vecData); in _dot_m_v() 110 *px++ = inner::from_accumulator(sum3); in _dot_m_v()
|
/cmsis-dsp-latest/dsppp/Include/dsppp/DSP/ |
D | matrix_multiply.hpp | 154 ACC sum3 = ACC{}; in _dot_m_v() 185 sum3 = inner::vmacc(sum3, matData, vecData); in _dot_m_v() 201 sum3 = inner::mac(sum3,*pInA3++ , tmpData); in _dot_m_v() 208 *px++ = inner::from_accumulator(sum3); in _dot_m_v()
|