Searched refs:acc_0 (Results 1 – 2 of 2) sorted by relevance
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32/ |
D | matmul_fp32.c | 897 float32x4_t acc_0; in MatVecMulFp32Neon64() local 900 acc_0 = vld1q_f32(bias + ci); in MatVecMulFp32Neon64() 903 acc_0 = vdupq_n_f32(0.0f); in MatVecMulFp32Neon64() 922 acc_0 = vmlaq_n_f32(acc_0, bv_00, av[0]); in MatVecMulFp32Neon64() 924 acc_0 = vmlaq_n_f32(acc_0, bv_01, av[1]); in MatVecMulFp32Neon64() 926 acc_0 = vmlaq_n_f32(acc_0, bv_02, av[2]); in MatVecMulFp32Neon64() 928 acc_0 = vmlaq_n_f32(acc_0, bv_03, av[3]); in MatVecMulFp32Neon64() 936 acc_0 = vmlaq_n_f32(acc_0, bv0, ai); in MatVecMulFp32Neon64() 945 c[i] = MSMAX(acc_0[i], 0.0f); in MatVecMulFp32Neon64() 947 c[i] = MSMIN(MSMAX(acc_0[i], 0.0f), 6.0f); in MatVecMulFp32Neon64() [all …]
|
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp16/ |
D | matmul_fp16.c | 404 float16x8_t acc_0 = vdupq_n_f16((float16_t)0.0); in VecMatmulFp16() local 407 acc_0 = vld1q_f16(bias); in VecMatmulFp16() 425 acc_0 = vfmaq_n_f16(acc_0, bv_0[i], av[i]); in VecMatmulFp16() 436 acc_0 = vfmaq_n_f16(acc_0, bv0, ai); in VecMatmulFp16() 441 acc_0 = vmaxq_f16(acc_0, vdupq_n_f16((float16_t)0.0)); in VecMatmulFp16() 445 acc_0 = vminq_f16(vmaxq_f16(acc_0, vdupq_n_f16((float16_t)0.0)), vdupq_n_f16((float16_t)6.0)); in VecMatmulFp16() 452 c[i] = acc_0[i]; in VecMatmulFp16() 456 vst1q_f16(c, acc_0); in VecMatmulFp16()
|