Home
last modified time | relevance | path

Searched refs:sum6 (Results 1 – 6 of 6) sorted by relevance

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/cuda_impl/
Dlayer_norm_grad_grad_impl.cu193 … const T &epsilon, T *sum5, T *sum6, T *sum7, T *share_mem, in InputThreadReduceOuterMean() argument
222 sum6[0] += part2; in InputThreadReduceOuterMean()
231 … const half &epsilon, half *sum5, half *sum6, half *sum7, in InputThreadReduceOuterMean() argument
260 sum6[0] += part2; in InputThreadReduceOuterMean()
268 inline __device__ void InputWarpReduceOuterMean(T *sum5, T *sum6, T *sum7) { in InputWarpReduceOuterMean() argument
271 sum6[0] += __shfl_down_sync(0xffffffff, sum6[0], delta); in InputWarpReduceOuterMean()
277 inline __device__ void InputBlockReduceOuterMean(const int &col_dim, T *sum5, T *sum6, T *sum7, T *… in InputBlockReduceOuterMean() argument
284 share_mem[offset + 5] = sum6[0]; in InputBlockReduceOuterMean()
370 T sum6 = 0; in InputPropKernel() local
379 …InputThreadReduceOuterMean(row, col_dim, param_dim, epsilon, &sum5, &sum6, &sum7, share_mem.addr()… in InputPropKernel()
[all …]
/third_party/cmsis/CMSIS/DSP/Source/MatrixFunctions/
Darm_mat_mult_f32.c549 float32_t sum0,sum1, sum2,sum3, sum4, sum5 , sum6, sum7; in arm_mat_mult_f32() local
598 sum6 = 0.0f; in arm_mat_mult_f32()
686 sum6 += vget_lane_f32(accum, 0) + vget_lane_f32(accum, 1); in arm_mat_mult_f32()
704 sum6 += *pIn1G++ * (*pIn2); in arm_mat_mult_f32()
719 *pxG++ = sum6; in arm_mat_mult_f32()
/third_party/ffmpeg/libavfilter/
Dvf_convolution.c192 int sum6 = c0[x] * 5 + c1[x] * -3 + c2[x] * -3 + in filter16_kirsch() local
202 sum6 = FFMAX(sum6, sum7); in filter16_kirsch()
204 sum4 = FFMAX(sum4, sum6); in filter16_kirsch()
295 int sum6 = c0[x] * 5 + c1[x] * -3 + c2[x] * -3 + in filter_kirsch() local
305 sum6 = FFMAX(sum6, sum7); in filter_kirsch()
307 sum4 = FFMAX(sum4, sum6); in filter_kirsch()
/third_party/ffmpeg/libavcodec/mips/
Dhpeldsp_msa.c670 v8u16 sum0, sum1, sum2, sum3, sum4, sum5, sum6, sum7; in common_hv_bil_no_rnd_8x8_msa() local
698 sum6 = add6 + add7 + 1; in common_hv_bil_no_rnd_8x8_msa()
702 SRA_4V(sum4, sum5, sum6, sum7, 2); in common_hv_bil_no_rnd_8x8_msa()
705 PCKEV_B2_SB(sum5, sum4, sum7, sum6, out0, out1); in common_hv_bil_no_rnd_8x8_msa()
/third_party/mindspore/tests/st/ops/gpu/
Dtest_layer_norm_grad_grad_op.py91 sum6 = np.mean(part2, tuple(norm_axis), keepdims=True)
93 part4 = -(x - mean) * np.power(var + epsilon, -1.5) * (sum5 + sum6)
/third_party/ffmpeg/libpostproc/
Dpostprocess_altivec_template.c658 vector signed int sum5, sum6, sum7, sum8, sum9; in dering_altivec() local
694 const vector signed int sump46 = vec_mergel(sum4, sum6); in dering_altivec()