| /cmsis-dsp-latest/Source/MatrixFunctions/ |
| D | arm_mat_mult_f64.c | 83 uint32_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_f64() local 154 pIn1B = pIn1 + numColsA; in arm_mat_mult_f64() 155 pIn1C = pIn1 + 2*numColsA; in arm_mat_mult_f64() 156 pIn1D = pIn1 + 3*numColsA; in arm_mat_mult_f64() 157 pIn1E = pIn1 + 4*numColsA; in arm_mat_mult_f64() 158 pIn1F = pIn1 + 5*numColsA; in arm_mat_mult_f64() 159 pIn1G = pIn1 + 6*numColsA; in arm_mat_mult_f64() 160 pIn1H = pIn1 + 7*numColsA; in arm_mat_mult_f64() 172 colCnt = numColsA >> 1U; in arm_mat_mult_f64() 226 colCnt = numColsA & 1; in arm_mat_mult_f64() [all …]
|
| D | arm_mat_mult_f32.c | 296 int numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_f32() local 314 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_f32() 350 pInA1 = pInA0 + numColsA; in arm_mat_mult_f32() 351 pInA2 = pInA1 + numColsA; in arm_mat_mult_f32() 352 pInA3 = pInA2 + numColsA; in arm_mat_mult_f32() 359 blkCnt = numColsA; in arm_mat_mult_f32() 393 pInB0 -= (numColsB * numColsA) - 4; in arm_mat_mult_f32() 401 pInA1 = pInA0 + numColsA; in arm_mat_mult_f32() 402 pInA2 = pInA1 + numColsA; in arm_mat_mult_f32() 403 pInA3 = pInA2 + numColsA; in arm_mat_mult_f32() [all …]
|
| D | arm_mat_mult_f16.c | 392 int numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_f16() local 412 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_f16() 443 pInA1 = pInA0 + numColsA; in arm_mat_mult_f16() 444 pInA2 = pInA1 + numColsA; in arm_mat_mult_f16() 445 pInA3 = pInA2 + numColsA; in arm_mat_mult_f16() 452 blkCnt = numColsA; in arm_mat_mult_f16() 481 pInB0 -= (numColsB * numColsA) - 8; in arm_mat_mult_f16() 489 pInA1 = pInA0 + numColsA; in arm_mat_mult_f16() 490 pInA2 = pInA1 + numColsA; in arm_mat_mult_f16() 491 pInA3 = pInA2 + numColsA; in arm_mat_mult_f16() [all …]
|
| D | arm_mat_mult_fast_q15.c | 80 uint16_t numColsA = pSrcA->numCols; /* Number of columns of input matrix A */ in arm_mat_mult_fast_q15() local 258 pInA2 = pInA + numColsA; in arm_mat_mult_fast_q15() 262 colCnt = numColsA >> 1U; in arm_mat_mult_fast_q15() 264 colCnt = numColsA >> 2U; in arm_mat_mult_fast_q15() 311 if (numColsA & 1U) { in arm_mat_mult_fast_q15() 322 colCnt = numColsA % 0x4U; in arm_mat_mult_fast_q15() 349 i = i + numColsA; in arm_mat_mult_fast_q15() 352 i = i + numColsA; in arm_mat_mult_fast_q15() 387 colCnt = numColsA >> 2U; in arm_mat_mult_fast_q15() 404 colCnt = numColsA & 3U; in arm_mat_mult_fast_q15() [all …]
|
| D | arm_mat_mult_fast_q31.c | 80 uint16_t numColsA = pSrcA->numCols; /* Number of columns of input matrix A */ in arm_mat_mult_fast_q31() local 131 pInA2 = pInA + numColsA; in arm_mat_mult_fast_q31() 133 colCnt = numColsA; in arm_mat_mult_fast_q31() 174 i = i + (numColsA << 1U); in arm_mat_mult_fast_q31() 207 colCnt = numColsA >> 2U; in arm_mat_mult_fast_q31() 245 colCnt = numColsA % 4U; in arm_mat_mult_fast_q31() 250 colCnt = numColsA; in arm_mat_mult_fast_q31() 288 pInA = pSrcA->pData + (numRowsA-1) * numColsA; in arm_mat_mult_fast_q31() 297 colCnt = numColsA >> 2U; in arm_mat_mult_fast_q31() 335 colCnt = numColsA % 4U; in arm_mat_mult_fast_q31() [all …]
|
| D | arm_mat_mult_q15.c | 336 uint32_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_q15() local 358 if (numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q15() 424 pInA2 = pInA + numColsA; in arm_mat_mult_q15() 442 blkCnt = numColsA / 8; in arm_mat_mult_q15() 462 blkCnt = numColsA & 7; in arm_mat_mult_q15() 487 i = i + numColsA * 2; in arm_mat_mult_q15() 523 blkCnt = (numColsA) / 8; in arm_mat_mult_q15() 536 blkCnt = (numColsA & 7); in arm_mat_mult_q15() 548 i += numColsA; in arm_mat_mult_q15() 574 pInA = pSrcA->pData + (numRowsA - 1) * numColsA; in arm_mat_mult_q15() [all …]
|
| D | arm_mat_mult_opt_q31.c | 354 uint32_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_opt_q31() local 373 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_opt_q31() 434 pInA2 = pInA + numColsA; in arm_mat_mult_opt_q31() 453 blkCnt = (numColsA / 4); in arm_mat_mult_opt_q31() 474 blkCnt = (numColsA & 3); in arm_mat_mult_opt_q31() 507 i = i + numColsA * 2; in arm_mat_mult_opt_q31() 543 blkCnt = (numColsA / 4); in arm_mat_mult_opt_q31() 557 blkCnt = (numColsA & 3); in arm_mat_mult_opt_q31() 570 i += numColsA; in arm_mat_mult_opt_q31() 596 pInA = pSrcA->pData + (numRowsA - 1) * numColsA; in arm_mat_mult_opt_q31() [all …]
|
| D | arm_mat_mult_q7.c | 284 uint32_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_q7() local 308 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q7() 368 pInA2 = pInA + numColsA; in arm_mat_mult_q7() 385 blkCnt = numColsA >> 4; in arm_mat_mult_q7() 407 blkCnt = numColsA & 0xF; in arm_mat_mult_q7() 433 i = i + numColsA * 2; in arm_mat_mult_q7() 471 blkCnt = (numColsA) >> 4; in arm_mat_mult_q7() 486 blkCnt = numColsA & 0xF; in arm_mat_mult_q7() 499 i += numColsA; in arm_mat_mult_q7() 527 pInA = pSrcA->pData + (numRowsA - 1) * numColsA; in arm_mat_mult_q7() [all …]
|
| D | arm_mat_mult_q31.c | 346 uint16_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_mult_q31() local 368 if(numRowsA == numColsB && numColsB == numColsA) { in arm_mat_mult_q31() 424 q31_t const *pInA1 = pInA0 + numColsA; in arm_mat_mult_q31() 425 q31_t const *pInA2 = pInA1 + numColsA; in arm_mat_mult_q31() 426 q31_t const *pInA3 = pInA2 + numColsA; in arm_mat_mult_q31() 442 blkCnt = numColsA >> 2; in arm_mat_mult_q31() 466 blkCnt = numColsA & 3; in arm_mat_mult_q31() 508 pInA += (numColsA * 4); in arm_mat_mult_q31() 556 blkCnt = numColsA >> 2; in arm_mat_mult_q31() 575 blkCnt = numColsA & 3; in arm_mat_mult_q31() [all …]
|
| D | arm_mat_cmplx_mult_q15.c | 76 uint32_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_cmplx_mult_q15() local 167 blkCnt = (numColsA * CMPLX_DIM) >> 3; in arm_mat_cmplx_mult_q15() 191 blkCnt = (numColsA * CMPLX_DIM) & 7; in arm_mat_cmplx_mult_q15() 260 blkCnt = (numColsA * CMPLX_DIM) >> 3; in arm_mat_cmplx_mult_q15() 280 blkCnt = (numColsA * CMPLX_DIM) & 7; in arm_mat_cmplx_mult_q15() 299 i = i + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_q15() 327 uint16_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_cmplx_mult_q15() local 454 colCnt = numColsA >> 1U; in arm_mat_cmplx_mult_q15() 531 if ((numColsA & 0x1U) > 0U) in arm_mat_cmplx_mult_q15() 577 i = i + numColsA; in arm_mat_cmplx_mult_q15()
|
| D | arm_mat_cmplx_mult_f16.c | 392 uint16_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_cmplx_mult_f16() local 417 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_f16() 480 float16_t const *pInA1 = pInA0 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 481 float16_t const *pInA2 = pInA1 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 482 float16_t const *pInA3 = pInA2 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 500 blkCnt = (numColsA * CMPLX_DIM) >> 3; in arm_mat_cmplx_mult_f16() 536 blkCnt = (numColsA * CMPLX_DIM) & 7; in arm_mat_cmplx_mult_f16() 586 pInA += (numColsA * 4) * CMPLX_DIM; in arm_mat_cmplx_mult_f16() 636 blkCnt = (numColsA * CMPLX_DIM) >> 3; in arm_mat_cmplx_mult_f16() 660 blkCnt = (numColsA * CMPLX_DIM) & 7; in arm_mat_cmplx_mult_f16() [all …]
|
| D | arm_mat_cmplx_mult_f32.c | 534 uint16_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_cmplx_mult_f32() local 558 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_f32() 617 float32_t const *pInA1 = pInA0 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f32() 618 float32_t const *pInA2 = pInA1 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f32() 619 float32_t const *pInA3 = pInA2 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_f32() 637 blkCnt = (numColsA * CMPLX_DIM) >> 2; in arm_mat_cmplx_mult_f32() 669 blkCnt = (numColsA * CMPLX_DIM) & 3; in arm_mat_cmplx_mult_f32() 718 pInA += (numColsA * 4) * CMPLX_DIM; in arm_mat_cmplx_mult_f32() 768 blkCnt = (numColsA * CMPLX_DIM) >> 2; in arm_mat_cmplx_mult_f32() 792 blkCnt = (numColsA * CMPLX_DIM) & 3; in arm_mat_cmplx_mult_f32() [all …]
|
| D | arm_mat_cmplx_mult_q31.c | 528 uint16_t numColsA = pSrcA->numCols; /* number of columns of input matrix A */ in arm_mat_cmplx_mult_q31() local 551 if (numRowsA == numColsB && numColsB == numColsA) in arm_mat_cmplx_mult_q31() 617 q31_t const *pInA1 = pInA0 + numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_q31() 634 blkCnt = (numColsA * CMPLX_DIM) >> 2; in arm_mat_cmplx_mult_q31() 666 blkCnt = (numColsA * CMPLX_DIM) & 3; in arm_mat_cmplx_mult_q31() 708 pInA += (numColsA * 2) * CMPLX_DIM; in arm_mat_cmplx_mult_q31() 759 blkCnt = (numColsA * CMPLX_DIM) >> 2; in arm_mat_cmplx_mult_q31() 783 blkCnt = (numColsA * CMPLX_DIM) & 3; in arm_mat_cmplx_mult_q31() 823 pInA += numColsA * CMPLX_DIM; in arm_mat_cmplx_mult_q31() 849 uint16_t numColsA = pSrcA->numCols; /* Number of columns of input matrix A */ in arm_mat_cmplx_mult_q31() local [all …]
|
| /cmsis-dsp-latest/dsppp/Include/dsppp/Helium/ |
| D | matrix_multiply.hpp | 99 int numColsA = pSrcA.columns(); /* number of columns of input matrix A */ 105 if(numRowsA == numColsB && numColsB == numColsA) { 150 blkCnt = numColsA; 184 pInB0 -= (pSrcB.stride() * numColsA) - nb_lanes; 203 blkCnt = numColsA; 261 blkCnt = numColsA; 285 pInB0 -= (pSrcB.stride() * numColsA) - nb_lanes; 296 blkCnt = numColsA;
|
| D | matrix_multiply_fixed.hpp | 336 uint32_t numColsA = pSrcA.columns(); /* number of columns of input matrix A */ 351 if (numRowsA == numColsB && numColsB == numColsA) { 429 blkCnt = numColsA / nb_lanes; 449 blkCnt = numColsA & (nb_lanes-1); 513 blkCnt = (numColsA) / nb_lanes; 526 blkCnt = (numColsA & (nb_lanes-1)); 575 blkCnt = ((numColsA) / nb_lanes); 588 blkCnt = (numColsA & 7); 598 i += numColsA;
|
| /cmsis-dsp-latest/dsppp/Include/dsppp/Scalar/ |
| D | matrix_multiply_fixed.hpp | 46 uint16_t numColsA = pSrcA.columns(); /* Number of columns of input matrix A */ in _dot_m_m() local 74 colCnt = numColsA >> 2U; in _dot_m_m() 99 colCnt = numColsA % 0x4U; in _dot_m_m()
|
| D | matrix_multiply_float.hpp | 41 uint16_t numColsA = pSrcA.columns(); /* Number of columns of input matrix A */ in _dot_m_m() local 69 colCnt = numColsA >> 2U; in _dot_m_m() 94 colCnt = numColsA % 0x4U; in _dot_m_m()
|
| /cmsis-dsp-latest/dsppp/Include/dsppp/DSP/ |
| D | matrix_multiply.hpp | 277 uint16_t numColsA = pSrcA.columns(); /* Number of columns of input matrix A */ in _dot_m_m() local 309 colCnt = numColsA / (2*nb_lanes); in _dot_m_m() 336 colCnt = numColsA & (2*nb_lanes-1); in _dot_m_m()
|