/third_party/cmsis/CMSIS/DSP/Source/MatrixFunctions/ |
D | arm_mat_mult_fast_q31.c | 72 q31_t *pInB = pSrcB->pData; /* Input data matrix pointer B */ in arm_mat_mult_fast_q31() local 113 pInB = pSrcB->pData; in arm_mat_mult_fast_q31() 130 pInB = pSrcB->pData + j; in arm_mat_mult_fast_q31() 141 inB1 = pInB[0]; in arm_mat_mult_fast_q31() 143 inB2 = pInB[1]; in arm_mat_mult_fast_q31() 144 pInB += numColsB; in arm_mat_mult_fast_q31() 199 pInB = pSrcB->pData + numColsB-1; in arm_mat_mult_fast_q31() 213 sum1 = __SMMLA(*pInA++, *pInB, sum1); in arm_mat_mult_fast_q31() 215 sum1 = (q31_t) ((((q63_t) sum1 << 32) + ((q63_t) *pInA++ * *pInB)) >> 32); in arm_mat_mult_fast_q31() 217 pInB += numColsB; in arm_mat_mult_fast_q31() [all …]
|
D | arm_mat_mult_fast_q15.c | 76 q15_t *pInB = pSrcB->pData; /* Input data matrix pointer B of Q15 type */ in arm_mat_mult_fast_q15() local 128 in = read_q15x2_ia (&pInB); in arm_mat_mult_fast_q15() 150 in = read_q15x2_ia (&pInB); in arm_mat_mult_fast_q15() 168 in = *pInB++; in arm_mat_mult_fast_q15() 176 in = *pInB++; in arm_mat_mult_fast_q15() 180 in = *pInB++; in arm_mat_mult_fast_q15() 184 in = *pInB++; in arm_mat_mult_fast_q15() 201 *px = *pInB++; in arm_mat_mult_fast_q15() 236 pInB = pSrcBT; in arm_mat_mult_fast_q15() 257 pInB = pSrcBT + j; in arm_mat_mult_fast_q15() [all …]
|
D | arm_mat_mult_q7.c | 65 q7_t const *pInB = (q7_t const *)pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q7_2x2_mve() local 77 pInB = pSrcB->pData; in arm_mat_mult_q7_2x2_mve() 79 vecB = vldrbq_gather_offset_z(pInB, vecColBOffs, p0); in arm_mat_mult_q7_2x2_mve() 92 pInB = pInB + 1; in arm_mat_mult_q7_2x2_mve() 94 vecB = vldrbq_gather_offset_z(pInB, vecColBOffs, p0); in arm_mat_mult_q7_2x2_mve() 114 q7_t const *pInB = (q7_t const *)pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q7_3x3_mve() local 128 pInB = pSrcB->pData; in arm_mat_mult_q7_3x3_mve() 130 vecB = vldrbq_gather_offset_z(pInB, vecColBOffs, p0); in arm_mat_mult_q7_3x3_mve() 146 pInB = pInB + 1; in arm_mat_mult_q7_3x3_mve() 148 vecB = vldrbq_gather_offset_z(pInB, vecColBOffs, p0); in arm_mat_mult_q7_3x3_mve() [all …]
|
D | arm_mat_mult_q15.c | 76 q15_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q15_2x2_mve() local 88 pInB = pSrcB->pData; in arm_mat_mult_q15_2x2_mve() 90 vecB = vldrhq_gather_shifted_offset_z_s16((q15_t const *)pInB, vecColBOffs, p0); in arm_mat_mult_q15_2x2_mve() 106 pInB = pInB + 1; in arm_mat_mult_q15_2x2_mve() 108 vecB = vldrhq_gather_shifted_offset_z_s16(pInB, vecColBOffs, p0); in arm_mat_mult_q15_2x2_mve() 132 q15_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q15_3x3_mve() local 146 pInB = pSrcB->pData; in arm_mat_mult_q15_3x3_mve() 148 vecB = vldrhq_gather_shifted_offset_z_s16((q15_t const *)pInB, vecColBOffs, p0); in arm_mat_mult_q15_3x3_mve() 168 pInB = pInB + 1; in arm_mat_mult_q15_3x3_mve() 170 vecB = vldrhq_gather_shifted_offset_z_s16(pInB, vecColBOffs, p0); in arm_mat_mult_q15_3x3_mve() [all …]
|
D | arm_mat_mult_q31.c | 72 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q31_2x2_mve() local 86 pInB = pSrcB->pData; in arm_mat_mult_q31_2x2_mve() 89 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_q31_2x2_mve() 106 pInB = pInB + 1; in arm_mat_mult_q31_2x2_mve() 108 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_q31_2x2_mve() 131 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_q31_3x3_mve() local 146 pInB = pSrcB->pData; in arm_mat_mult_q31_3x3_mve() 148 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_q31_3x3_mve() 167 pInB = pInB + 1; in arm_mat_mult_q31_3x3_mve() 169 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_q31_3x3_mve() [all …]
|
D | arm_mat_cmplx_mult_q15.c | 71 … q15_t const *pInB = (q15_t const *) pSrcB->pData; /* input data matrix pointer B of Q15 type */ in arm_mat_cmplx_mult_q15() local 143 pInB = pSrcB->pData + j; in arm_mat_cmplx_mult_q15() 144 pInB2 = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_q15() 172 vecB = vldrhq_gather_shifted_offset(pInB, vecOffs); in arm_mat_cmplx_mult_q15() 195 vecB = vldrhq_gather_shifted_offset(pInB, vecOffs); in arm_mat_cmplx_mult_q15() 237 pInB = pSrcB->pData + j; in arm_mat_cmplx_mult_q15() 265 vecB = vldrhq_gather_shifted_offset(pInB, vecOffs); in arm_mat_cmplx_mult_q15() 284 vecB = vldrhq_gather_shifted_offset(pInB, vecOffs); in arm_mat_cmplx_mult_q15() 323 q15_t *pInB = pSrcB->pData; /* input data matrix pointer B of Q15 type */ in arm_mat_cmplx_mult_q15() local 371 write_q15x2 (px, read_q15x2_ia (&pInB)); in arm_mat_cmplx_mult_q15() [all …]
|
D | arm_mat_mult_opt_q31.c | 76 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_opt_q31_2x2_mve() local 90 pInB = pSrcB->pData; in arm_mat_mult_opt_q31_2x2_mve() 93 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_opt_q31_2x2_mve() 110 pInB = pInB + 1; in arm_mat_mult_opt_q31_2x2_mve() 112 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_opt_q31_2x2_mve() 135 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_opt_q31_3x3_mve() local 150 pInB = pSrcB->pData; in arm_mat_mult_opt_q31_3x3_mve() 152 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_opt_q31_3x3_mve() 171 pInB = pInB + 1; in arm_mat_mult_opt_q31_3x3_mve() 173 vecB = vldrwq_gather_shifted_offset_z_s32(pInB, vecColBOffs, p0); in arm_mat_mult_opt_q31_3x3_mve() [all …]
|
D | arm_mat_cmplx_mult_f16.c | 71 float16_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_f16_2x2_mve() local 96 pInB = (float16_t const *)pSrcB->pData; in arm_mat_cmplx_mult_f16_2x2_mve() 102 vecB = vldrhq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_f16_2x2_mve() 145 float16_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_f16_3x3_mve() local 166 pInB = (float16_t const *)pSrcB->pData; in arm_mat_cmplx_mult_f16_3x3_mve() 172 vecB = vldrhq_gather_shifted_offset_z(pInB, vecColBOffs0, p0); in arm_mat_cmplx_mult_f16_3x3_mve() 190 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_f16_3x3_mve() 192 vecB = vldrhq_gather_shifted_offset_z(pInB, vecColBOffs0, p0); in arm_mat_cmplx_mult_f16_3x3_mve() 210 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_f16_3x3_mve() 212 vecB = vldrhq_gather_shifted_offset_z(pInB, vecColBOffs0, p0); in arm_mat_cmplx_mult_f16_3x3_mve() [all …]
|
D | arm_mat_cmplx_mult_q31.c | 72 q31_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_q31_2x2_mve() local 88 pInB = (q31_t const *) pSrcB->pData; in arm_mat_cmplx_mult_q31_2x2_mve() 90 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_q31_2x2_mve() 106 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_q31_2x2_mve() 108 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_q31_2x2_mve() 134 q31_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_q31_3x3_mve() local 160 pInB = (q31_t const *) pSrcB->pData; in arm_mat_cmplx_mult_q31_3x3_mve() 162 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_q31_3x3_mve() 163 vecB1 = vldrwq_gather_shifted_offset(pInB, vecColBOffs1); in arm_mat_cmplx_mult_q31_3x3_mve() 201 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_q31_3x3_mve() [all …]
|
D | arm_mat_cmplx_mult_f32.c | 76 float32_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_f32_2x2_mve() local 91 pInB = (float32_t const *)pSrcB->pData; in arm_mat_cmplx_mult_f32_2x2_mve() 93 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_f32_2x2_mve() 112 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_f32_2x2_mve() 114 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_f32_2x2_mve() 140 float32_t const *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_cmplx_mult_f32_3x3_mve() local 162 pInB = (float32_t const *)pSrcB->pData; in arm_mat_cmplx_mult_f32_3x3_mve() 164 vecB = vldrwq_gather_shifted_offset(pInB, vecColBOffs0); in arm_mat_cmplx_mult_f32_3x3_mve() 179 vecB = vldrwq_gather_shifted_offset_z(pInB, vecColBOffs1, p0); in arm_mat_cmplx_mult_f32_3x3_mve() 205 pInB = pInB + CMPLX_DIM; in arm_mat_cmplx_mult_f32_3x3_mve() [all …]
|
D | arm_mat_sub_q15.c | 134 q15_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_sub_q15() local 170 write_q15x2_ia (&pOut, __QSUB16(read_q15x2_ia (&pInA), read_q15x2_ia (&pInB))); in arm_mat_sub_q15() 171 write_q15x2_ia (&pOut, __QSUB16(read_q15x2_ia (&pInA), read_q15x2_ia (&pInB))); in arm_mat_sub_q15() 173 *pOut++ = (q15_t) __SSAT(((q31_t) * pInA++ - *pInB++), 16); in arm_mat_sub_q15() 174 *pOut++ = (q15_t) __SSAT(((q31_t) * pInA++ - *pInB++), 16); in arm_mat_sub_q15() 175 *pOut++ = (q15_t) __SSAT(((q31_t) * pInA++ - *pInB++), 16); in arm_mat_sub_q15() 176 *pOut++ = (q15_t) __SSAT(((q31_t) * pInA++ - *pInB++), 16); in arm_mat_sub_q15() 199 *pOut++ = (q15_t) __QSUB16(*pInA++, *pInB++); in arm_mat_sub_q15() 201 *pOut++ = (q15_t) __SSAT(((q31_t) * pInA++ - *pInB++), 16); in arm_mat_sub_q15()
|
D | arm_mat_add_q15.c | 137 q15_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_add_q15() local 174 write_q15x2_ia (&pOut, __QADD16(read_q15x2_ia (&pInA), read_q15x2_ia (&pInB))); in arm_mat_add_q15() 176 write_q15x2_ia (&pOut, __QADD16(read_q15x2_ia (&pInA), read_q15x2_ia (&pInB))); in arm_mat_add_q15() 178 *pOut++ = (q15_t) __SSAT(((q31_t) *pInA++ + *pInB++), 16); in arm_mat_add_q15() 180 *pOut++ = (q15_t) __SSAT(((q31_t) *pInA++ + *pInB++), 16); in arm_mat_add_q15() 182 *pOut++ = (q15_t) __SSAT(((q31_t) *pInA++ + *pInB++), 16); in arm_mat_add_q15() 184 *pOut++ = (q15_t) __SSAT(((q31_t) *pInA++ + *pInB++), 16); in arm_mat_add_q15() 207 *pOut++ = (q15_t) __QADD16(*pInA++, *pInB++); in arm_mat_add_q15() 209 *pOut++ = (q15_t) __SSAT(((q31_t) *pInA++ + *pInB++), 16); in arm_mat_add_q15()
|
D | arm_mat_sub_f64.c | 57 float64_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_sub_f64() local 93 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f64() 94 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f64() 95 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f64() 96 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f64() 117 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f64()
|
D | arm_mat_sub_f16.c | 135 float16_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_sub_f16() local 171 *pOut++ = (_Float16)(*pInA++) - (_Float16)(*pInB++); in arm_mat_sub_f16() 172 *pOut++ = (_Float16)(*pInA++) - (_Float16)(*pInB++); in arm_mat_sub_f16() 173 *pOut++ = (_Float16)(*pInA++) - (_Float16)(*pInB++); in arm_mat_sub_f16() 174 *pOut++ = (_Float16)(*pInA++) - (_Float16)(*pInB++); in arm_mat_sub_f16() 195 *pOut++ = (_Float16)(*pInA++) - (_Float16)(*pInB++); in arm_mat_sub_f16()
|
D | arm_mat_sub_q31.c | 138 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_sub_q31() local 174 *pOut++ = __QSUB(*pInA++, *pInB++); in arm_mat_sub_q31() 176 *pOut++ = __QSUB(*pInA++, *pInB++); in arm_mat_sub_q31() 178 *pOut++ = __QSUB(*pInA++, *pInB++); in arm_mat_sub_q31() 180 *pOut++ = __QSUB(*pInA++, *pInB++); in arm_mat_sub_q31() 201 *pOut++ = __QSUB(*pInA++, *pInB++); in arm_mat_sub_q31()
|
D | arm_mat_add_f16.c | 134 float16_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_add_f16() local 170 *pOut++ = (_Float16)*pInA++ + (_Float16)*pInB++; in arm_mat_add_f16() 172 *pOut++ = (_Float16)*pInA++ + (_Float16)*pInB++; in arm_mat_add_f16() 174 *pOut++ = (_Float16)*pInA++ + (_Float16)*pInB++; in arm_mat_add_f16() 176 *pOut++ = (_Float16)*pInA++ + (_Float16)*pInB++; in arm_mat_add_f16() 197 *pOut++ = (_Float16)*pInA++ + (_Float16)*pInB++; in arm_mat_add_f16()
|
D | arm_mat_add_q31.c | 136 q31_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_add_q31() local 172 *pOut++ = __QADD(*pInA++, *pInB++); in arm_mat_add_q31() 174 *pOut++ = __QADD(*pInA++, *pInB++); in arm_mat_add_q31() 176 *pOut++ = __QADD(*pInA++, *pInB++); in arm_mat_add_q31() 178 *pOut++ = __QADD(*pInA++, *pInB++); in arm_mat_add_q31() 199 *pOut++ = __QADD(*pInA++, *pInB++); in arm_mat_add_q31()
|
D | arm_mat_sub_f32.c | 239 float32_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_sub_f32() local 275 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f32() 276 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f32() 277 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f32() 278 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f32() 299 *pOut++ = (*pInA++) - (*pInB++); in arm_mat_sub_f32()
|
D | arm_mat_add_f32.c | 243 float32_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_add_f32() local 279 *pOut++ = *pInA++ + *pInB++; in arm_mat_add_f32() 281 *pOut++ = *pInA++ + *pInB++; in arm_mat_add_f32() 283 *pOut++ = *pInA++ + *pInB++; in arm_mat_add_f32() 285 *pOut++ = *pInA++ + *pInB++; in arm_mat_add_f32() 306 *pOut++ = *pInA++ + *pInB++; in arm_mat_add_f32()
|
D | arm_mat_mult_f32.c | 145 float32_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_f32_3x3_mve() local 153 pSrBVec = (float32_t const *) pInB; in arm_mat_mult_f32_3x3_mve() 210 float32_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_f32_4x4_mve() local 217 pSrBVec = (float32_t const *) pInB; in arm_mat_mult_f32_4x4_mve() 291 float32_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_f32() local 317 pOut[0] = pInA[0] * pInB[0]; in arm_mat_mult_f32() 343 pInB0 = pInB; in arm_mat_mult_f32() 461 pInB0 = pInB; in arm_mat_mult_f32() 892 float32_t *pInB = pSrcB->pData; /* Input data matrix pointer B */ in arm_mat_mult_f32() local 995 pIn2 = pInB + (numColsB - col); in arm_mat_mult_f32()
|
D | arm_mat_mult_f16.c | 387 float16_t *pInB = pSrcB->pData; /* input data matrix pointer B */ in arm_mat_mult_f16() local 436 pInB0 = pInB; in arm_mat_mult_f16() 548 pInB0 = pInB; in arm_mat_mult_f16() 632 float16_t *pInB = pSrcB->pData; /* Input data matrix pointer B */ in arm_mat_mult_f16() local 735 pIn2 = pInB + (numColsB - col); in arm_mat_mult_f16()
|
D | arm_mat_mult_f64.c | 384 float64_t *pInB = pSrcB->pData; /* Input data matrix pointer B */ in arm_mat_mult_f64() local 487 pIn2 = pInB + (numColsB - col); in arm_mat_mult_f64()
|
/third_party/cmsis/CMSIS/DSP/Source/StatisticsFunctions/ |
D | arm_kullback_leibler_f32.c | 113 const float32_t *pInA, *pInB; in arm_kullback_leibler_f32() local 122 pInB = pSrcB; in arm_kullback_leibler_f32() 133 tmpVB = vld1q_f32(pInB); in arm_kullback_leibler_f32() 134 pInB += 4; in arm_kullback_leibler_f32() 153 pB = *pInB++; in arm_kullback_leibler_f32() 166 const float32_t *pInA, *pInB; in arm_kullback_leibler_f32() local 171 pInB = pSrcB; in arm_kullback_leibler_f32() 179 pB = *pInB++; in arm_kullback_leibler_f32()
|
D | arm_kullback_leibler_f64.c | 51 const float64_t *pInA, *pInB; in arm_kullback_leibler_f64() local 56 pInB = pSrcB; in arm_kullback_leibler_f64() 64 pB = *pInB++; in arm_kullback_leibler_f64()
|
D | arm_kullback_leibler_f16.c | 123 const float16_t *pInA, *pInB; in arm_kullback_leibler_f16() local 128 pInB = pSrcB; in arm_kullback_leibler_f16() 136 pB = *pInB++; in arm_kullback_leibler_f16()
|