/cmsis-dsp-latest/Source/MatrixFunctions/ |
D | arm_mat_mult_fast_q31.c | 79 uint16_t numColsB = pSrcB->numCols; /* Number of columns of input matrix B */ in arm_mat_mult_fast_q31() local 103 px2 = px + numColsB; in arm_mat_mult_fast_q31() 110 col = numColsB; in arm_mat_mult_fast_q31() 144 pInB += numColsB; in arm_mat_mult_fast_q31() 175 px = px2 + (numColsB & 1U); in arm_mat_mult_fast_q31() 176 px2 = px + numColsB; in arm_mat_mult_fast_q31() 185 if (numColsB & 1U) { in arm_mat_mult_fast_q31() 191 px = pDst->pData + numColsB-1; in arm_mat_mult_fast_q31() 199 pInB = pSrcB->pData + numColsB-1; in arm_mat_mult_fast_q31() 217 pInB += numColsB; in arm_mat_mult_fast_q31() [all …]
|
D | arm_mat_mult_f64.c | 82 uint32_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_f64() local 122 pxB = px + numColsB; in arm_mat_mult_f64() 123 pxC = px + 2*numColsB; in arm_mat_mult_f64() 124 pxD = px + 3*numColsB; in arm_mat_mult_f64() 125 pxE = px + 4*numColsB; in arm_mat_mult_f64() 126 pxF = px + 5*numColsB; in arm_mat_mult_f64() 127 pxG = px + 6*numColsB; in arm_mat_mult_f64() 128 pxH = px + 7*numColsB; in arm_mat_mult_f64() 131 col = numColsB; in arm_mat_mult_f64() 197 pIn2 += numColsB; in arm_mat_mult_f64() [all …]
|
D | arm_mat_mult_f32.c | 295 int numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_f32() local 314 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_f32() 340 pOut1 = pOut0 + numColsB; in arm_mat_mult_f32() 341 pOut2 = pOut1 + numColsB; in arm_mat_mult_f32() 342 pOut3 = pOut2 + numColsB; in arm_mat_mult_f32() 345 uint32_t k = numColsB >> 2; in arm_mat_mult_f32() 373 pInB0 = pInB0 + numColsB; in arm_mat_mult_f32() 393 pInB0 -= (numColsB * numColsA) - 4; in arm_mat_mult_f32() 397 int colBLeft = numColsB & 3; in arm_mat_mult_f32() 425 pInB0 = pInB0 + numColsB; in arm_mat_mult_f32() [all …]
|
D | arm_mat_mult_f16.c | 391 int numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_f16() local 412 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_f16() 433 pOut1 = pOut0 + numColsB; in arm_mat_mult_f16() 434 pOut2 = pOut1 + numColsB; in arm_mat_mult_f16() 435 pOut3 = pOut2 + numColsB; in arm_mat_mult_f16() 438 int k = numColsB >> 3; in arm_mat_mult_f16() 466 pInB0 = pInB0 + numColsB; in arm_mat_mult_f16() 481 pInB0 -= (numColsB * numColsA) - 8; in arm_mat_mult_f16() 485 int colBLeft = numColsB & 7; in arm_mat_mult_f16() 513 pInB0 = pInB0 + numColsB; in arm_mat_mult_f16() [all …]
|
D | arm_mat_cmplx_mult_q15.c | 75 uint32_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_cmplx_mult_q15() local 101 vecColBOffs[2] = numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_q15() 102 vecColBOffs[3] = (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_q15() 103 vecColBOffs[4] = 2 * numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_q15() 104 vecColBOffs[5] = 2 * (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_q15() 105 vecColBOffs[6] = 3 * numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_q15() 106 vecColBOffs[7] = 3 * (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_q15() 127 col = numColsB >> 1; in arm_mat_cmplx_mult_q15() 180 vecOffs = vaddq_n_u16(vecOffs, (uint16_t) (numColsB * 4 * CMPLX_DIM)); in arm_mat_cmplx_mult_q15() 206 vecOffs = vaddq_n_u16(vecOffs, (uint16_t) (numColsB * 4 * CMPLX_DIM)); in arm_mat_cmplx_mult_q15() [all …]
|
D | arm_mat_mult_fast_q15.c | 79 uint16_t numColsB = pSrcB->numCols; /* Number of columns of input matrix B */ in arm_mat_mult_fast_q15() local 118 col = numColsB >> 2U; in arm_mat_mult_fast_q15() 196 col = numColsB % 0x4U; in arm_mat_mult_fast_q15() 225 px2 = px + numColsB; in arm_mat_mult_fast_q15() 233 col = numColsB; in arm_mat_mult_fast_q15() 353 px = px2 + (numColsB & 1U); in arm_mat_mult_fast_q15() 354 px2 = px + numColsB; in arm_mat_mult_fast_q15() 367 if (numColsB & 1U) { in arm_mat_mult_fast_q15() 373 px = pDst->pData + numColsB-1; in arm_mat_mult_fast_q15() 381 pInB = pSrcBT + numRowsB * (numColsB-1); in arm_mat_mult_fast_q15() [all …]
|
D | arm_mat_cmplx_mult_f16.c | 391 uint16_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_cmplx_mult_f16() local 417 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_f16() 435 vecColBOffs[2] = numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 436 vecColBOffs[3] = (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_f16() 437 vecColBOffs[4] = 2*numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 438 vecColBOffs[5] = 2*(numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_f16() 439 vecColBOffs[6] = 3*numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 440 vecColBOffs[7] = 3*(numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_f16() 456 i = i + 4 * numColsB; in arm_mat_cmplx_mult_f16() 460 col = numColsB; in arm_mat_cmplx_mult_f16() [all …]
|
D | arm_mat_cmplx_mult_f32.c | 533 uint16_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_cmplx_mult_f32() local 558 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_f32() 576 vecColBOffs[2] = numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_f32() 577 vecColBOffs[3] = (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_f32() 593 i = i + 4 * numColsB; in arm_mat_cmplx_mult_f32() 597 col = numColsB; in arm_mat_cmplx_mult_f32() 646 vecOffs = vecOffs + (uint32_t) (numColsB * 2 * CMPLX_DIM); in arm_mat_cmplx_mult_f32() 679 vecOffs = vecOffs + (uint32_t) (numColsB * 2 * CMPLX_DIM); in arm_mat_cmplx_mult_f32() 696 px[0 * CMPLX_DIM * numColsB + 0] = acc0[0] + acc0[2]; in arm_mat_cmplx_mult_f32() 697 px[0 * CMPLX_DIM * numColsB + 1] = acc0[1] + acc0[3]; in arm_mat_cmplx_mult_f32() [all …]
|
D | arm_mat_mult_q31.c | 345 uint16_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_q31() local 368 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q31() 384 vecColBOffs = vecColBOffs * (uint32_t) (numColsB); in arm_mat_mult_q31() 400 i = i + 4 * numColsB; in arm_mat_mult_q31() 404 col = numColsB; in arm_mat_mult_q31() 449 vecOffs = vecOffs + (uint32_t) (numColsB * 4); in arm_mat_mult_q31() 491 px[1 * numColsB] = (q31_t) acc1; in arm_mat_mult_q31() 492 px[2 * numColsB] = (q31_t) acc2; in arm_mat_mult_q31() 493 px[3 * numColsB] = (q31_t) acc3; in arm_mat_mult_q31() 502 pInB = (q31_t const *)pSrcB->pData + (numColsB - col); in arm_mat_mult_q31() [all …]
|
D | arm_mat_mult_opt_q31.c | 353 uint32_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_opt_q31() local 373 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_opt_q31() 392 BT.numRows = numColsB; in arm_mat_mult_opt_q31() 405 px2 = px + numColsB; in arm_mat_mult_opt_q31() 417 col = numColsB >> 1; in arm_mat_mult_opt_q31() 508 px = px2 + (numColsB & 1u); in arm_mat_mult_opt_q31() 509 px2 = px + numColsB; in arm_mat_mult_opt_q31() 519 if (numColsB & 1u) { in arm_mat_mult_opt_q31() 521 px = pDst->pData + numColsB - 1; in arm_mat_mult_opt_q31() 535 pInB = pSrcBT + numRowsB * (numColsB - 1); in arm_mat_mult_opt_q31() [all …]
|
D | arm_mat_mult_q7.c | 283 uint32_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_q7() local 308 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q7() 320 BT.numRows = numColsB; in arm_mat_mult_q7() 332 px2 = px + numColsB; in arm_mat_mult_q7() 346 col = numColsB >> 1; in arm_mat_mult_q7() 434 px = px2 + (numColsB & 1u); in arm_mat_mult_q7() 435 px2 = px + numColsB; in arm_mat_mult_q7() 446 if (numColsB & 1u) in arm_mat_mult_q7() 449 px = pDst->pData + numColsB - 1; in arm_mat_mult_q7() 464 pInB = pSrcBT + numRowsB * (numColsB - 1); in arm_mat_mult_q7() [all …]
|
D | arm_mat_mult_q15.c | 335 uint32_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_mult_q15() local 358 if (numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q15() 377 BT.numRows = numColsB; in arm_mat_mult_q15() 390 px2 = px + numColsB; in arm_mat_mult_q15() 403 col = numColsB >> 1; in arm_mat_mult_q15() 488 px = px2 + (numColsB & 1u); in arm_mat_mult_q15() 489 px2 = px + numColsB; in arm_mat_mult_q15() 500 if (numColsB & 1u) { in arm_mat_mult_q15() 502 px = pDst->pData + numColsB - 1; in arm_mat_mult_q15() 516 pInB = pSrcBT + numRowsB * (numColsB - 1); in arm_mat_mult_q15() [all …]
|
D | arm_mat_cmplx_mult_q31.c | 527 uint16_t numColsB = pSrcB->numCols; /* number of columns of input matrix B */ in arm_mat_cmplx_mult_q31() local 551 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_q31() 576 vecColBOffs[2] = numColsB * CMPLX_DIM; in arm_mat_cmplx_mult_q31() 577 vecColBOffs[3] = (numColsB * CMPLX_DIM) + 1; in arm_mat_cmplx_mult_q31() 593 i = i + 2 * numColsB; in arm_mat_cmplx_mult_q31() 597 col = numColsB; in arm_mat_cmplx_mult_q31() 643 vecOffs = vecOffs + (uint32_t) (numColsB * 2 * CMPLX_DIM); in arm_mat_cmplx_mult_q31() 677 vecOffs = vecOffs + (uint32_t) (numColsB * 2 * CMPLX_DIM); in arm_mat_cmplx_mult_q31() 690 px[0 * CMPLX_DIM * numColsB + 0] = (q31_t) clip_q63_to_q31(acc0 >> 31); in arm_mat_cmplx_mult_q31() 691 px[0 * CMPLX_DIM * numColsB + 1] = (q31_t) clip_q63_to_q31(acc1 >> 31); in arm_mat_cmplx_mult_q31() [all …]
|
/cmsis-dsp-latest/dsppp/Include/dsppp/Helium/ |
D | matrix_multiply.hpp | 98 int numColsB = pSrcB.columns(); /* number of columns of input matrix B */ 105 if(numRowsA == numColsB && numColsB == numColsA) { 136 uint32_t k = numColsB / nb_lanes; 188 int colBLeft = numColsB & (nb_lanes - 1); 255 uint32_t k = numColsB / nb_lanes; 289 int colBLeft = numColsB & (nb_lanes-1);
|
D | matrix_multiply_fixed.hpp | 335 uint32_t numColsB = pSrcB.columns(); /* number of columns of input matrix B */ 351 if (numRowsA == numColsB && numColsB == numColsA) { 390 col = numColsB >> 1; 476 px = px2 + (numColsB & 1u); 488 if (numColsB & 1u) { 506 pInB = pSrcBT + numRowsB * (numColsB - 1); 547 col = numColsB;
|
/cmsis-dsp-latest/dsppp/Include/dsppp/Scalar/ |
D | matrix_multiply_fixed.hpp | 45 uint16_t numColsB = pSrcB.columns(); /* Number of columns of input matrix B */ in _dot_m_m() local 58 col = numColsB; in _dot_m_m() 121 pIn2 = pInB + (numColsB - col) ; in _dot_m_m()
|
D | matrix_multiply_float.hpp | 40 uint16_t numColsB = pSrcB.columns(); /* Number of columns of input matrix B */ in _dot_m_m() local 53 col = numColsB; in _dot_m_m() 115 pIn2 = pInB + (numColsB - col); in _dot_m_m()
|
/cmsis-dsp-latest/dsppp/Include/dsppp/DSP/ |
D | matrix_multiply.hpp | 276 uint16_t numColsB = pSrcB.columns(); /* Number of columns of input matrix B */ in _dot_m_m() local 294 col = numColsB; in _dot_m_m()
|