Home
last modified time | relevance | path

Searched refs:MS_MLAQ_F32 (Results 1 – 5 of 5) sorted by relevance

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/intrinsics/sse/
DConvDwFp32Row_sse.c43 dst1 = MS_MLAQ_F32(dst1, w1, in1); in ConvDwFp32Row()
44 dst2 = MS_MLAQ_F32(dst2, w2, in2); in ConvDwFp32Row()
45 dst3 = MS_MLAQ_F32(dst3, w3, in3); in ConvDwFp32Row()
46 dst4 = MS_MLAQ_F32(dst4, w4, in4); in ConvDwFp32Row()
62 dst1 = MS_MLAQ_F32(dst1, w1, in1); in ConvDwFp32Row()
63 dst2 = MS_MLAQ_F32(dst2, w2, in2); in ConvDwFp32Row()
74 dst1 = MS_MLAQ_F32(dst1, w1, in1); in ConvDwFp32Row()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32/
Dscale_fp32.c44 MS_FLOAT32X4 result = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleInner()
77 MS_FLOAT32X4 result = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleAxis()
135 MS_FLOAT32X4 tmp = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleInnerRelu()
177 MS_FLOAT32X4 tmp = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleAxisRelu()
239 MS_FLOAT32X4 tmp = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleInnerRelu6()
283 MS_FLOAT32X4 tmp = MS_MLAQ_F32(offset_4, data, scale_4); in ScaleAxisRelu6()
Dconv_depthwise_fp32.c606 acc0 = MS_MLAQ_F32(acc0, MS_LDQ_F32(line1), g10); in ConvDw3x3Line()
607 acc1 = MS_MLAQ_F32(acc1, MS_LDQ_F32(line1 + 4), g11); in ConvDw3x3Line()
608 acc2 = MS_MLAQ_F32(acc2, MS_LDQ_F32(line1 + 8), g12); in ConvDw3x3Line()
609 acc3 = MS_MLAQ_F32(acc3, MS_LDQ_F32(line1 + 12), g13); in ConvDw3x3Line()
611 acc0 = MS_MLAQ_F32(acc0, MS_LDQ_F32(line2), g20); in ConvDw3x3Line()
612 acc1 = MS_MLAQ_F32(acc1, MS_LDQ_F32(line2 + 4), g21); in ConvDw3x3Line()
613 acc2 = MS_MLAQ_F32(acc2, MS_LDQ_F32(line2 + 8), g22); in ConvDw3x3Line()
614 acc3 = MS_MLAQ_F32(acc3, MS_LDQ_F32(line2 + 12), g23); in ConvDw3x3Line()
644 acc0 = MS_MLAQ_F32(acc0, MS_LDQ_F32(line1), g10); in ConvDw3x3Line()
645 acc1 = MS_MLAQ_F32(acc1, MS_LDQ_F32(line1 + 4), g11); in ConvDw3x3Line()
[all …]
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/intrinsics/
Dms_simd_instructions.h56 #define MS_MLAQ_F32(src1, src2, src3) vmlaq_f32(src1, src2, src3) macro
132 #define MS_MLAQ_F32(src1, src2, src3) _mm_add_ps(src1, _mm_mul_ps(src2, src3)) macro
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/base/
Dminimal_filtering_generator.c246 res = MS_MLAQ_F32(res, matrix_a[h_offset + i], matrix_b[w + i * n]); in MatrixMultiplyVec()