Home
last modified time | relevance | path

Searched refs:dst_4 (Results 1 – 6 of 6) sorted by relevance

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp16_grad/
Darithmetic_self_grad.c29 float16x8_t dst_4 = vmulq_f16(src0_4, vrecpeq_f16(vmulq_f16(src1_4, log_10))); in Fp16LogGrad() local
30 vst1q_f16(dst + i, dst_4); in Fp16LogGrad()
Dactivation_grad.c135 float16x4_t dst_4 = vbsl_f16(mask_4, src0_4, vmul_f16(alpha_4, vmul_f16(expm1_4, src0_4))); in EluFp16Grad() local
136 vst1_f16(dst + i, dst_4); in EluFp16Grad()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32_grad/
Dactivation_grad.c32 float32x4_t dst_4 = vbslq_f32(mask_4, src0_4, zero_4); in ReluGrad() local
33 vst1q_f32(dst + i, dst_4); in ReluGrad()
53 float32x4_t dst_4 = vbslq_f32(mask_4, src0_4, zero_4); in Relu6Grad() local
54 vst1q_f32(dst + i, dst_4); in Relu6Grad()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32/
Dconv_common_fp32.c440 float *dst_4 = dst + out_step * C3NUM; in SWConv3x32Kernel() local
587 : "a"(act_flag), "r"(out_step), "r"(dst), "r"(write_mode), "r"(dst_4) in SWConv3x32Kernel()
599 float *dst_4 = dst + out_step * C3NUM; in SWConv1x32Kernel() local
683 : "a"(act_flag), "r"(out_step), "r"(dst), "r"(write_mode), "r"(dst_4) in SWConv1x32Kernel()
Dconv_depthwise_fp32.c877 float32x4_t dst_4 = vld1q_f32(dst_kw); in DeconvDwBorderPixel() local
878 dst_4 = vfmaq_f32(dst_4, src_4, weight_4); in DeconvDwBorderPixel()
879 vst1q_f32(dst_kw, dst_4); in DeconvDwBorderPixel()
/third_party/mesa3d/src/intel/compiler/
Dbrw_vec4_generator.cpp1134 struct brw_reg dst_4 = suboffset(vec1(dst), 4); in generate_unpack_flags() local
1137 brw_AND(p, dst_4, flags, brw_imm_ud(0xf0)); in generate_unpack_flags()
1138 brw_SHR(p, dst_4, dst_4, brw_imm_ud(4)); in generate_unpack_flags()