Home
last modified time | relevance | path

Searched refs:vmuls (Results 1 – 20 of 20) sorted by relevance

/third_party/mindspore/mindspore/ops/_op_impl/_custom_op/
Dbatchnorm_fold.py67 batch_mean = te.lang.cce.vmuls(x_sum, num_rec)
70 variance_div = te.lang.cce.vmuls(x_square_sum, num_rec)
78 batch_var_unbiased = te.lang.cce.vmuls(batch_var_biased, batch_var_scaler)
82 mean_mul = te.lang.cce.vmuls(batch_mean, factor)
83 mean_mul_rev = te.lang.cce.vmuls(mean, factor_reverse)
86 var_mul = te.lang.cce.vmuls(batch_var_unbiased, factor)
87 var_mul_rev = te.lang.cce.vmuls(variance, factor_reverse)
Dmatmul_cube_dense_right_impl.py118 … tik_instance.vmuls(64, resmatmul_local_ub, resmatmul_local_ub, matrix_max_scalar, 255, 1, 1, 8, 8)
119 tik_instance.vmuls(64, resmatmul_local_ub[255 * 64], resmatmul_local_ub[255 * 64],
121 tik_instance.vmuls(64, resmatmul_local_ub[510 * 64], resmatmul_local_ub[510 * 64],
171 … tik_instance.vmuls(64, resmatmul_local_ub, resmatmul_local_ub, matrix_max_scalar, 255, 1, 1, 8, 8)
172 …tik_instance.vmuls(64, resmatmul_local_ub[255 * 64], resmatmul_local_ub[255 * 64], matrix_max_scal…
174 …tik_instance.vmuls(64, resmatmul_local_ub[510 * 64], resmatmul_local_ub[510 * 64], matrix_max_scal…
195 …tik_instance.vmuls(64, resmatmul_local_ub1, resmatmul_local_ub1, matrix_max_scalar, 255, 1, 1, 8, …
196 …tik_instance.vmuls(64, resmatmul_local_ub1[255 * 64], resmatmul_local_ub1[255 * 64], matrix_max_sc…
Dcholesky_trsm_impl.py65 … tik_instance.vmuls(64, assist_2_ub[0], assist_1_ub[0], scalar1, vector_repeat_times, 1, 1, 8, 8)
68 …tik_instance.vmuls(64, input_x_ub[i, 0], input_x_ub[i, 0], scalar2, vector_repeat_times, 1, 1, 8, …
72 … tik_instance.vmuls(64, temp_ub[j, 0], input_x_ub[i, 0], scalar3, vector_repeat_times, 1, 1, 8, 8)
96 … tik_instance.vmuls(64, assist_2_ub, temp_ub[j + index + 1, 0], chol_diag_element_loop,
105 …tik_instance.vmuls(64, temp_ub[index, 0], temp_ub[index, 0], chol_diag_element, vector_repeat_time…
Dminmax_update_perchannel.py69 min_val = te.lang.cce.vadd(te.lang.cce.vmuls(
70 min_val, ema_decay), te.lang.cce.vmuls(x_min, (1 - ema_decay)))
71 max_val = te.lang.cce.vadd(te.lang.cce.vmuls(
72 max_val, ema_decay), te.lang.cce.vmuls(x_max, (1 - ema_decay)))
Dminmax_update_perlayer.py66 min_val = te.lang.cce.vadd(te.lang.cce.vmuls(
67 min_val, ema_decay), te.lang.cce.vmuls(x_min, (1 - ema_decay)))
68 max_val = te.lang.cce.vadd(te.lang.cce.vmuls(
69 max_val, ema_decay), te.lang.cce.vmuls(x_max, (1 - ema_decay)))
Dfake_quant_perlayer_grad.py67 res_max_mul = te.lang.cce.vmuls(res_max, max_value)
68 res_max_mul_max = te.lang.cce.vmuls(res_max_mul, max_value)
69 res = te.lang.cce.vmuls(res_max_mul_max, factor_value)
92 max_val = te.lang.cce.vmax(te.lang.cce.vmuls(min_val, -1.), max_val)
93 min_val = te.lang.cce.vmuls(max_val, -1.)
Dfake_learned_scale_quant_perchannel_grad.py77 res_mul1 = te.lang.cce.vmuls(vmin, max_support_fp32)
78 res_mul2 = te.lang.cce.vmuls(res_mul1, max_support_fp32)
79 sign = te.lang.cce.vmuls(res_mul2, tvm.const(2 ** 2, dtype=dtype))
84 res_mul1 = te.lang.cce.vmuls(vmin, max_support_fp16)
85 sign = te.lang.cce.vmuls(res_mul1, max_support_fp16)
Dfake_learned_scale_quant_perlayer_grad.py78 res_mul1 = te.lang.cce.vmuls(vmin, max_support_fp32)
79 res_mul2 = te.lang.cce.vmuls(res_mul1, max_support_fp32)
80 sign = te.lang.cce.vmuls(res_mul2, tvm.const(2 ** 2, dtype=dtype))
85 res_mul1 = te.lang.cce.vmuls(vmin, max_support_fp16)
86 sign = te.lang.cce.vmuls(res_mul1, max_support_fp16)
Dfake_quant_perchannel_grad.py66 res_max_mul = te.lang.cce.vmuls(res_max, max_value)
67 res_max_mul_max = te.lang.cce.vmuls(res_max_mul, max_value)
68 res = te.lang.cce.vmuls(res_max_mul_max, factor_value)
Dbatchnorm_fold2_grad.py71 d_batch_mean = te.lang.cce.vmuls(d_batch_mean, -1.)
75 d_gamma = te.lang.cce.vmuls(d_gamma, -1.)
Dfake_quant_perchannel.py61 max_val = te.lang.cce.vmax(te.lang.cce.vmuls(min_val, -1.), max_val)
62 min_val = te.lang.cce.vmuls(max_val, -1.)
Dfake_quant_perlayer.py61 max_val = te.lang.cce.vmax(te.lang.cce.vmuls(min_val, -1.), max_val)
62 min_val = te.lang.cce.vmuls(max_val, -1.)
Dmatmul_cube_fracz_right_mul_impl.py233 tik_instance.vmuls(vectorfp32_size,
239 tik_instance.vmuls(vectorfp32_size,
Dbatchnorm_fold_grad.py71 dx = te.lang.cce.vmuls(dx, tvm.const(1. / normal_size, dtype=dx.dtype))
Dmatmul_dds_impl.py339 tik_inst.vmuls(
/third_party/skia/third_party/externals/swiftshader/third_party/subzero/src/
DIceAssemblerARM32.h555 void vmuls(const Operand *OpSd, const Operand *OpSn, const Operand *OpSm,
DIceInstARM32.cpp1269 Asm->vmuls(Dest, getSrc(0), getSrc(1), CondARM32::AL); in emitIAS()
DIceAssemblerARM32.cpp3297 void AssemblerARM32::vmuls(const Operand *OpSd, const Operand *OpSn, in vmuls() function in Ice::ARM32::AssemblerARM32
/third_party/skia/third_party/externals/swiftshader/third_party/subzero/src/DartARM32/
Dassembler_arm.h676 void vmuls(SRegister sd, SRegister sn, SRegister sm, Condition cond = AL);
Dassembler_arm.cc950 void Assembler::vmuls(SRegister sd, SRegister sn, SRegister sm,