/third_party/cmsis/CMSIS/DSP/Source/SupportFunctions/ |
D | arm_weighted_sum_f32.c | 57 float32_t accum1, accum2; in arm_weighted_sum_f32() local 86 accum2 = vecAddAcrossF32Mve(accum2V); in arm_weighted_sum_f32() 92 accum2 += *pW++; in arm_weighted_sum_f32() 97 return (accum1 / accum2); in arm_weighted_sum_f32() 107 float32_t accum1, accum2; in arm_weighted_sum_f32() local 121 accum2=0.0f; in arm_weighted_sum_f32() 144 accum2 = vget_lane_f32(tempV, 0) + vget_lane_f32(tempV, 1); in arm_weighted_sum_f32() 150 accum2 += *pW++; in arm_weighted_sum_f32() 155 return(accum1 / accum2); in arm_weighted_sum_f32() 161 float32_t accum1, accum2; in arm_weighted_sum_f32() local [all …]
|
D | arm_weighted_sum_f16.c | 70 _Float16 accum1, accum2; in arm_weighted_sum_f16() local 99 accum2 = vecAddAcrossF16Mve(accum2V); in arm_weighted_sum_f16() 105 accum2 += (_Float16)*pW++; in arm_weighted_sum_f16() 110 return (accum1 / accum2); in arm_weighted_sum_f16() 118 _Float16 accum1, accum2; in arm_weighted_sum_f16() local 127 accum2=0.0f16; in arm_weighted_sum_f16() 133 accum2 += (_Float16)*pW++; in arm_weighted_sum_f16() 137 return(accum1 / accum2); in arm_weighted_sum_f16()
|
/third_party/openssl/crypto/ec/curve448/arch_32/ |
D | f_impl.c | 19 uint64_t accum0 = 0, accum1 = 0, accum2 = 0; in gf_mul() local 30 accum2 = 0; in gf_mul() 32 accum2 += widemul(a[j - i], b[i]); in gf_mul() 36 accum1 -= accum2; in gf_mul() 37 accum0 += accum2; in gf_mul() 38 accum2 = 0; in gf_mul() 41 accum2 += widemul(aa[8 + j - i], bb[i]); in gf_mul() 44 accum1 += accum2; in gf_mul() 45 accum0 += accum2; in gf_mul()
|
/third_party/cmsis/CMSIS/DSP/Source/SVMFunctions/ |
D | arm_svm_linear_predict_f32.c | 297 float32x2_t accum2; in arm_svm_linear_predict_f32() local 354 accum2 = vpadd_f32(vget_low_f32(accuma),vget_high_f32(accuma)); in arm_svm_linear_predict_f32() 355 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,0); in arm_svm_linear_predict_f32() 357 accum2 = vpadd_f32(vget_low_f32(accumb),vget_high_f32(accumb)); in arm_svm_linear_predict_f32() 358 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,1); in arm_svm_linear_predict_f32() 360 accum2 = vpadd_f32(vget_low_f32(accumc),vget_high_f32(accumc)); in arm_svm_linear_predict_f32() 361 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,2); in arm_svm_linear_predict_f32() 363 accum2 = vpadd_f32(vget_low_f32(accumd),vget_high_f32(accumd)); in arm_svm_linear_predict_f32() 364 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,3); in arm_svm_linear_predict_f32() 384 accum2 = vpadd_f32(vget_low_f32(accum),vget_high_f32(accum)); in arm_svm_linear_predict_f32() [all …]
|
D | arm_svm_polynomial_predict_f32.c | 317 float32x2_t accum2; in arm_svm_polynomial_predict_f32() local 374 accum2 = vpadd_f32(vget_low_f32(accuma),vget_high_f32(accuma)); in arm_svm_polynomial_predict_f32() 375 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,0); in arm_svm_polynomial_predict_f32() 377 accum2 = vpadd_f32(vget_low_f32(accumb),vget_high_f32(accumb)); in arm_svm_polynomial_predict_f32() 378 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,1); in arm_svm_polynomial_predict_f32() 380 accum2 = vpadd_f32(vget_low_f32(accumc),vget_high_f32(accumc)); in arm_svm_polynomial_predict_f32() 381 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,2); in arm_svm_polynomial_predict_f32() 383 accum2 = vpadd_f32(vget_low_f32(accumd),vget_high_f32(accumd)); in arm_svm_polynomial_predict_f32() 384 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,3); in arm_svm_polynomial_predict_f32() 410 accum2 = vpadd_f32(vget_low_f32(accum),vget_high_f32(accum)); in arm_svm_polynomial_predict_f32() [all …]
|
D | arm_svm_sigmoid_predict_f32.c | 315 float32x2_t accum2; in arm_svm_sigmoid_predict_f32() local 372 accum2 = vpadd_f32(vget_low_f32(accuma),vget_high_f32(accuma)); in arm_svm_sigmoid_predict_f32() 373 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,0); in arm_svm_sigmoid_predict_f32() 375 accum2 = vpadd_f32(vget_low_f32(accumb),vget_high_f32(accumb)); in arm_svm_sigmoid_predict_f32() 376 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,1); in arm_svm_sigmoid_predict_f32() 378 accum2 = vpadd_f32(vget_low_f32(accumc),vget_high_f32(accumc)); in arm_svm_sigmoid_predict_f32() 379 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,2); in arm_svm_sigmoid_predict_f32() 381 accum2 = vpadd_f32(vget_low_f32(accumd),vget_high_f32(accumd)); in arm_svm_sigmoid_predict_f32() 382 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,3); in arm_svm_sigmoid_predict_f32() 408 accum2 = vpadd_f32(vget_low_f32(accum),vget_high_f32(accum)); in arm_svm_sigmoid_predict_f32() [all …]
|
D | arm_svm_rbf_predict_f32.c | 335 float32x2_t accum2; in arm_svm_rbf_predict_f32() local 400 accum2 = vpadd_f32(vget_low_f32(accuma),vget_high_f32(accuma)); in arm_svm_rbf_predict_f32() 401 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,0); in arm_svm_rbf_predict_f32() 403 accum2 = vpadd_f32(vget_low_f32(accumb),vget_high_f32(accumb)); in arm_svm_rbf_predict_f32() 404 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,1); in arm_svm_rbf_predict_f32() 406 accum2 = vpadd_f32(vget_low_f32(accumc),vget_high_f32(accumc)); in arm_svm_rbf_predict_f32() 407 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,2); in arm_svm_rbf_predict_f32() 409 accum2 = vpadd_f32(vget_low_f32(accumd),vget_high_f32(accumd)); in arm_svm_rbf_predict_f32() 410 dotV = vsetq_lane_f32(vget_lane_f32(accum2, 0) + vget_lane_f32(accum2, 1),dotV,3); in arm_svm_rbf_predict_f32() 439 accum2 = vpadd_f32(vget_low_f32(accum),vget_high_f32(accum)); in arm_svm_rbf_predict_f32() [all …]
|