/cmsis-dsp-latest/Source/QuaternionMathFunctions/ |
D | arm_quaternion_inverse_f32.c | 63 f32x4_t vec1,vec2; in arm_quaternion_inverse_f32() local 69 vec1 = vld1q(pInputQuaternions); in arm_quaternion_inverse_f32() 70 vec2 = vmulq(vec1,vec1); in arm_quaternion_inverse_f32() 74 vec1 = vmulq_n_f32(vec1, 1.0f / squaredSum); in arm_quaternion_inverse_f32() 75 vec1 = vsetq_lane_f32(-vgetq_lane(vec1, 0),vec1,0); in arm_quaternion_inverse_f32() 76 vec1 = vnegq_f32(vec1); in arm_quaternion_inverse_f32() 78 vst1q(pInverseQuaternions, vec1); in arm_quaternion_inverse_f32()
|
D | arm_quaternion_conjugate_f32.c | 61 f32x4_t vec1; in arm_quaternion_conjugate_f32() local 65 vec1 = vld1q(pInputQuaternions); in arm_quaternion_conjugate_f32() 68 vec1 = vsetq_lane_f32(-vgetq_lane(vec1, 0),vec1,0); in arm_quaternion_conjugate_f32() 69 vec1 = vnegq_f32(vec1); in arm_quaternion_conjugate_f32() 71 vst1q(pConjugateQuaternions, vec1); in arm_quaternion_conjugate_f32()
|
D | arm_quaternion_normalize_f32.c | 62 f32x4_t vec1,vec2; in arm_quaternion_normalize_f32() local 67 vec1 = vld1q(pInputQuaternions); in arm_quaternion_normalize_f32() 68 vec2 = vmulq(vec1,vec1); in arm_quaternion_normalize_f32() 71 vec1 = vmulq_n_f32(vec1, 1.0f / norm); in arm_quaternion_normalize_f32() 72 vst1q(pNormalizedQuaternions, vec1); in arm_quaternion_normalize_f32()
|
D | arm_quaternion_norm_f32.c | 63 f32x4_t vec1; in arm_quaternion_norm_f32() local 68 vec1 = vld1q(pInputQuaternions); in arm_quaternion_norm_f32() 69 vec1 = vmulq(vec1,vec1); in arm_quaternion_norm_f32() 70 squaredSum = vecAddAcrossF32Mve(vec1); in arm_quaternion_norm_f32()
|
D | arm_quaternion2rotation_f32.c | 84 f32x4_t vec0,vec1, vec2 ,vec3; in arm_quaternion2rotation_f32() local 94 vec1 = vmulq(vec0,vec0); in arm_quaternion2rotation_f32() 113 vec0 = vsetq_lane(vgetq_lane(vec1,0) + vgetq_lane(vec1,1),vec0,0); in arm_quaternion2rotation_f32() 114 vec0 = vsetq_lane(vgetq_lane(vec0,0) - vgetq_lane(vec1,2),vec0,0); in arm_quaternion2rotation_f32() 115 vec0 = vsetq_lane(vgetq_lane(vec0,0) - vgetq_lane(vec1,3),vec0,0); in arm_quaternion2rotation_f32() 123 tmp1 = vgetq_lane(vec1,0) - vgetq_lane(vec1,1); in arm_quaternion2rotation_f32() 124 tmp2 = vgetq_lane(vec1,2) - vgetq_lane(vec1,3); in arm_quaternion2rotation_f32()
|
/cmsis-dsp-latest/Source/BasicMathFunctions/ |
D | arm_negate_f32.c | 71 f32x4_t vec1; in arm_negate_f32() local 82 vec1 = vld1q(pSrc); in arm_negate_f32() 83 res = vnegq(vec1); in arm_negate_f32() 100 vec1 = vld1q((float32_t const *) pSrc); in arm_negate_f32() 101 vstrwq_p(pDst, vnegq(vec1), p0); in arm_negate_f32() 115 f32x4_t vec1; in arm_negate_f32() local 126 vec1 = vld1q_f32(pSrc); in arm_negate_f32() 127 res = vnegq_f32(vec1); in arm_negate_f32()
|
D | arm_abs_f32.c | 73 f32x4_t vec1; in arm_abs_f32() local 85 vec1 = vld1q(pSrc); in arm_abs_f32() 86 res = vabsq(vec1); in arm_abs_f32() 105 vec1 = vld1q(pSrc); in arm_abs_f32() 106 vstrwq_p(pDst, vabsq(vec1), p0); in arm_abs_f32() 120 f32x4_t vec1; in arm_abs_f32() local 131 vec1 = vld1q_f32(pSrc); in arm_abs_f32() 132 res = vabsq_f32(vec1); in arm_abs_f32()
|
D | arm_offset_f32.c | 74 f32x4_t vec1; in arm_offset_f32() local 84 vec1 = vld1q(pSrc); in arm_offset_f32() 85 res = vaddq(vec1,offset); in arm_offset_f32() 102 vec1 = vld1q((float32_t const *) pSrc); in arm_offset_f32() 103 vstrwq_p(pDst, vaddq(vec1, offset), p0); in arm_offset_f32() 119 f32x4_t vec1; in arm_offset_f32() local 130 vec1 = vld1q_f32(pSrc); in arm_offset_f32() 131 res = vaddq_f32(vec1,vdupq_n_f32(offset)); in arm_offset_f32()
|
D | arm_abs_f16.c | 60 f16x8_t vec1; in arm_abs_f16() local 72 vec1 = vld1q(pSrc); in arm_abs_f16() 73 res = vabsq(vec1); in arm_abs_f16() 92 vec1 = vld1q(pSrc); in arm_abs_f16() 93 vstrhq_p(pDst, vabsq(vec1), p0); in arm_abs_f16() 108 f16x8_t vec1; in arm_abs_f16() local 119 vec1 = vld1q_f16(pSrc); in arm_abs_f16() 120 res = vabsq_f16(vec1); in arm_abs_f16()
|
D | arm_mult_f32.c | 72 f32x4_t vec1; in arm_mult_f32() local 83 vec1 = vld1q(pSrcA); in arm_mult_f32() 85 res = vmulq(vec1, vec2); in arm_mult_f32() 103 vec1 = vld1q(pSrcA); in arm_mult_f32() 105 vstrwq_p(pDst, vmulq(vec1,vec2), p0); in arm_mult_f32() 120 f32x4_t vec1; in arm_mult_f32() local 132 vec1 = vld1q_f32(pSrcA); in arm_mult_f32() 134 res = vmulq_f32(vec1, vec2); in arm_mult_f32()
|
D | arm_sub_f32.c | 72 f32x4_t vec1; in arm_sub_f32() local 84 vec1 = vld1q(pSrcA); in arm_sub_f32() 86 res = vsubq(vec1, vec2); in arm_sub_f32() 105 vec1 = vld1q(pSrcA); in arm_sub_f32() 107 vstrwq_p(pDst, vsubq(vec1,vec2), p0); in arm_sub_f32() 122 f32x4_t vec1; in arm_sub_f32() local 134 vec1 = vld1q_f32(pSrcA); in arm_sub_f32() 136 res = vsubq_f32(vec1, vec2); in arm_sub_f32()
|
D | arm_scale_f32.c | 87 f32x4_t vec1; in arm_scale_f32() local 98 vec1 = vld1q(pSrc); in arm_scale_f32() 99 res = vmulq(vec1,scale); in arm_scale_f32() 116 vec1 = vld1q((float32_t const *) pSrc); in arm_scale_f32() 117 vstrwq_p(pDst, vmulq(vec1, scale), p0); in arm_scale_f32() 132 f32x4_t vec1; in arm_scale_f32() local 143 vec1 = vld1q_f32(pSrc); in arm_scale_f32() 144 res = vmulq_f32(vec1, vdupq_n_f32(scale)); in arm_scale_f32()
|
D | arm_add_f32.c | 72 f32x4_t vec1; in arm_add_f32() local 84 vec1 = vld1q(pSrcA); in arm_add_f32() 86 res = vaddq(vec1, vec2); in arm_add_f32() 105 vec1 = vld1q(pSrcA); in arm_add_f32() 107 vstrwq_p(pDst, vaddq(vec1,vec2), p0); in arm_add_f32() 122 f32x4_t vec1; in arm_add_f32() local 134 vec1 = vld1q_f32(pSrcA); in arm_add_f32() 136 res = vaddq_f32(vec1, vec2); in arm_add_f32()
|
D | arm_negate_f16.c | 58 f16x8_t vec1; in arm_negate_f16() local 69 vec1 = vld1q(pSrc); in arm_negate_f16() 70 res = vnegq(vec1); in arm_negate_f16() 87 vec1 = vld1q((float16_t const *) pSrc); in arm_negate_f16() 88 vstrhq_p(pDst, vnegq(vec1), p0); in arm_negate_f16()
|
D | arm_offset_f16.c | 60 f16x8_t vec1; in arm_offset_f16() local 70 vec1 = vld1q(pSrc); in arm_offset_f16() 71 res = vaddq(vec1,offset); in arm_offset_f16() 88 vec1 = vld1q((float16_t const *) pSrc); in arm_offset_f16() 89 vstrhq_p(pDst, vaddq(vec1, offset), p0); in arm_offset_f16()
|
D | arm_scale_f16.c | 62 f16x8_t vec1; in arm_scale_f16() local 73 vec1 = vld1q(pSrc); in arm_scale_f16() 74 res = vmulq(vec1,scale); in arm_scale_f16() 91 vec1 = vld1q((float16_t const *) pSrc); in arm_scale_f16() 92 vstrhq_p(pDst, vmulq(vec1, scale), p0); in arm_scale_f16()
|
D | arm_mult_f16.c | 62 f16x8_t vec1; in arm_mult_f16() local 73 vec1 = vld1q(pSrcA); in arm_mult_f16() 75 res = vmulq(vec1, vec2); in arm_mult_f16() 93 vec1 = vld1q(pSrcA); in arm_mult_f16() 95 vstrhq_p(pDst, vmulq(vec1,vec2), p0); in arm_mult_f16()
|
D | arm_sub_f16.c | 60 f16x8_t vec1; in arm_sub_f16() local 72 vec1 = vld1q(pSrcA); in arm_sub_f16() 74 res = vsubq(vec1, vec2); in arm_sub_f16() 93 vec1 = vld1q(pSrcA); in arm_sub_f16() 95 vstrhq_p(pDst, vsubq(vec1,vec2), p0); in arm_sub_f16()
|
D | arm_add_f16.c | 61 f16x8_t vec1; in arm_add_f16() local 73 vec1 = vld1q(pSrcA); in arm_add_f16() 75 res = vaddq(vec1, vec2); in arm_add_f16() 94 vec1 = vld1q(pSrcA); in arm_add_f16() 96 vstrhq_p(pDst, vaddq(vec1,vec2), p0); in arm_add_f16()
|
D | arm_dot_prod_f32.c | 131 f32x4_t vec1; in arm_dot_prod_f32() local 141 vec1 = vld1q_f32(pSrcA); in arm_dot_prod_f32() 149 accum = vmlaq_f32(accum, vec1, vec2); in arm_dot_prod_f32() 155 vec1 = vld1q_f32(pSrcA); in arm_dot_prod_f32()
|
/cmsis-dsp-latest/Source/SVMFunctions/ |
D | arm_svm_linear_predict_f32.c | 297 float32x4_t vec1; in arm_svm_linear_predict_f32() local 334 vec1 = vld1q_f32(pIn); in arm_svm_linear_predict_f32() 346 accuma = vmlaq_f32(accuma, vec1,vec2a); in arm_svm_linear_predict_f32() 347 accumb = vmlaq_f32(accumb, vec1,vec2b); in arm_svm_linear_predict_f32() 348 accumc = vmlaq_f32(accumc, vec1,vec2c); in arm_svm_linear_predict_f32() 349 accumd = vmlaq_f32(accumd, vec1,vec2d); in arm_svm_linear_predict_f32() 379 vec1 = vld1q_f32(pDualCoefs); in arm_svm_linear_predict_f32() 382 accum = vmulq_f32(vec1,dotV); in arm_svm_linear_predict_f32() 406 vec1 = vld1q_f32(pIn); in arm_svm_linear_predict_f32() 411 accum = vmlaq_f32(accum, vec1,vec2); in arm_svm_linear_predict_f32()
|
D | arm_svm_sigmoid_predict_f32.c | 315 float32x4_t vec1; in arm_svm_sigmoid_predict_f32() local 352 vec1 = vld1q_f32(pIn); in arm_svm_sigmoid_predict_f32() 364 accuma = vmlaq_f32(accuma, vec1,vec2a); in arm_svm_sigmoid_predict_f32() 365 accumb = vmlaq_f32(accumb, vec1,vec2b); in arm_svm_sigmoid_predict_f32() 366 accumc = vmlaq_f32(accumc, vec1,vec2c); in arm_svm_sigmoid_predict_f32() 367 accumd = vmlaq_f32(accumd, vec1,vec2d); in arm_svm_sigmoid_predict_f32() 397 vec1 = vld1q_f32(pDualCoefs); in arm_svm_sigmoid_predict_f32() 406 accum = vmulq_f32(vec1,dotV); in arm_svm_sigmoid_predict_f32() 431 vec1 = vld1q_f32(pIn); in arm_svm_sigmoid_predict_f32() 436 accum = vmlaq_f32(accum, vec1,vec2); in arm_svm_sigmoid_predict_f32()
|
D | arm_svm_polynomial_predict_f32.c | 317 float32x4_t vec1; in arm_svm_polynomial_predict_f32() local 354 vec1 = vld1q_f32(pIn); in arm_svm_polynomial_predict_f32() 366 accuma = vmlaq_f32(accuma, vec1,vec2a); in arm_svm_polynomial_predict_f32() 367 accumb = vmlaq_f32(accumb, vec1,vec2b); in arm_svm_polynomial_predict_f32() 368 accumc = vmlaq_f32(accumc, vec1,vec2c); in arm_svm_polynomial_predict_f32() 369 accumd = vmlaq_f32(accumd, vec1,vec2d); in arm_svm_polynomial_predict_f32() 399 vec1 = vld1q_f32(pDualCoefs); in arm_svm_polynomial_predict_f32() 408 accum = vmulq_f32(vec1,dotV); in arm_svm_polynomial_predict_f32() 433 vec1 = vld1q_f32(pIn); in arm_svm_polynomial_predict_f32() 438 accum = vmlaq_f32(accum, vec1,vec2); in arm_svm_polynomial_predict_f32()
|
D | arm_svm_rbf_predict_f32.c | 336 float32x4_t vec1; in arm_svm_rbf_predict_f32() local 373 vec1 = vld1q_f32(pIn); in arm_svm_rbf_predict_f32() 385 temp = vsubq_f32(vec1, vec2a); in arm_svm_rbf_predict_f32() 388 temp = vsubq_f32(vec1, vec2b); in arm_svm_rbf_predict_f32() 391 temp = vsubq_f32(vec1, vec2c); in arm_svm_rbf_predict_f32() 394 temp = vsubq_f32(vec1, vec2d); in arm_svm_rbf_predict_f32() 430 vec1 = vld1q_f32(pDualCoefs); in arm_svm_rbf_predict_f32() 437 accum = vmulq_f32(vec1,dotV); in arm_svm_rbf_predict_f32() 462 vec1 = vld1q_f32(pIn); in arm_svm_rbf_predict_f32() 467 temp = vsubq_f32(vec1,vec2); in arm_svm_rbf_predict_f32()
|
/cmsis-dsp-latest/Source/ComplexMathFunctions/ |
D | arm_cmplx_dot_prod_f32.c | 194 float32x4x2_t vec1,vec2,vec3,vec4; in arm_cmplx_dot_prod_f32() local 209 vec1 = vld2q_f32(pSrcA); in arm_cmplx_dot_prod_f32() 217 accR = vmlaq_f32(accR,vec1.val[0],vec2.val[0]); in arm_cmplx_dot_prod_f32() 218 accR = vmlsq_f32(accR,vec1.val[1],vec2.val[1]); in arm_cmplx_dot_prod_f32() 221 accI = vmlaq_f32(accI,vec1.val[1],vec2.val[0]); in arm_cmplx_dot_prod_f32() 222 accI = vmlaq_f32(accI,vec1.val[0],vec2.val[1]); in arm_cmplx_dot_prod_f32()
|