Home
last modified time | relevance | path

Searched refs:mat_b (Results 1 – 13 of 13) sorted by relevance

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp16_grad/
Dconvolution_grad_input.c42 const float16_t *mat_b[C16NUM]; in ConvDwInputGrad16() local
44 mat_b[j_i] = w + (j + j_i) * k_spatial; in ConvDwInputGrad16()
61 float16x8_t mat_b0 = {mat_b[0][k], mat_b[1][k], mat_b[2][k], mat_b[3][k], in ConvDwInputGrad16()
62 mat_b[4][k], mat_b[5][k], mat_b[6][k], mat_b[7][k]}; in ConvDwInputGrad16()
63 float16x8_t mat_b1 = {mat_b[8][k], mat_b[9][k], mat_b[10][k], mat_b[11][k], in ConvDwInputGrad16()
64 mat_b[12][k], mat_b[13][k], mat_b[14][k], mat_b[15][k]}; in ConvDwInputGrad16()
80 … : "r"(mat_b[0] + k), "r"(mat_b[1] + k), "r"(mat_b[2] + k), "r"(mat_b[3] + k), "r"(mat_b[4] + k), in ConvDwInputGrad16()
81 "r"(mat_b[5] + k), "r"(mat_b[6] + k), "r"(mat_b[7] + k) in ConvDwInputGrad16()
93 …: "r"(mat_b[8] + k), "r"(mat_b[9] + k), "r"(mat_b[10] + k), "r"(mat_b[11] + k), "r"(mat_b[12] + k), in ConvDwInputGrad16()
94 "r"(mat_b[13] + k), "r"(mat_b[14] + k), "r"(mat_b[15] + k) in ConvDwInputGrad16()
[all …]
Dgemm_fp16.h31 float16_t *mat_b; member
35 … const float16_t *mat_b, int ldb, float16_t beta, float16_t *mat_c, int ldc, float16_t *workspace);
37 const float16_t *mat_b, int ldb, float16_t beta, float16_t *mat_c, int ldc,
Dgemm_fp16.c339 …const float16_t *mat_b, int ldb, float16_t beta, float16_t *mat_c, int ldc, float16_t *workspace) { in GemmMatmulFp16() argument
345 …GemmMatmulPlusFp16(ta, tb, M, N, K, alpha, mat_a, lda, mat_b, ldb, beta, mat_c, ldc, workspace, &g… in GemmMatmulFp16()
349 const float16_t *mat_b, int ldb, float16_t beta, float16_t *mat_c, int ldc, in GemmMatmulPlusFp16() argument
360 float16_t *mat_b_input = (float16_t *)mat_b; in GemmMatmulPlusFp16()
375 RowMajor2Col8MajorStrideFp16(mat_b, mat_b_input, N, K, ldb); in GemmMatmulPlusFp16()
377 RowMajor2Row8MajorStrideFp16(mat_b, mat_b_input, K, N, ldb); in GemmMatmulPlusFp16()
384 gcb->mat_b = mat_b_input; in GemmMatmulPlusFp16()
/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/fp32_grad/
Dgemm.h31 float *mat_b; member
34 …(int ta, int tb, int M, int N, int K, float alpha, const float *mat_a, int lda, const float *mat_b,
36 …(int ta, int tb, int M, int N, int K, float alpha, const float *mat_a, int lda, const float *mat_b,
Dgemm.c539 …(int ta, int tb, int M, int N, int K, float alpha, const float *mat_a, int lda, const float *mat_b, argument
547 gcb.mat_b = NULL;
548 GemmMatmulPlus(ta, tb, M, N, K, alpha, mat_a, lda, mat_b, ldb, beta, mat_c, ldc, workspace, &gcb);
551 …(int ta, int tb, int M, int N, int K, float alpha, const float *mat_a, int lda, const float *mat_b, argument
562 float *mat_b_input = (float *)mat_b;
589 RowMajor2Col8MajorStride(mat_b, mat_b_input, N, K, ldb);
591 RowMajor2Row8MajorStride(mat_b, mat_b_input, K, N, ldb);
602 gcb->mat_b = mat_b_input;
Dconvolution_grad_input.c62 float32x4_t mat_b = {mat_b_0[k], mat_b_1[k], mat_b_2[k], mat_b_3[k]}; in ConvDwInputGrad() local
64 mat_c = vmlaq_f32(mat_c, mat_b, mat_a); in ConvDwInputGrad()
/third_party/mindspore/mindspore/lite/src/runtime/kernel/arm/fp32_grad/
Dconvolution.cc108 const float *mat_b = nullptr; in Execute() local
119 mat_b = w_addr + j * nweights / groups; in Execute()
121 …GemmMatmul(0, 1, real_chunk, n, k, 1, mat_a + (j * kernel_spatial), k * groups, mat_b, k, 0, mat_c… in Execute()
132 mat_b = w_addr + j * nweights / groups; in Execute()
136 … GemmMatmul(0, 1, real_chunk, n, k, 1, mat_a, k, mat_b, k, 0, mat_c, out_ch, mat_workspace); in Execute()
141 mat_b = w_addr; in Execute()
151 … GemmMatmul(0, 1, real_chunk, n, k, 1, im + offset, k, mat_b, k, 0, mat_c, out_ch, mat_workspace); in Execute()
Dconvolution_grad_input.cc129 float *mat_b = nullptr; in Execute() local
131 mat_b = w_addr + j * nweights / groups; in Execute()
137 mat_b = gcb.mat_b; in Execute()
144 …GemmMatmulPlus(0, 0, real_chunk, n, k, 1, mat_a, out_ch, mat_b, n, 0, mat_c, n, mat_workspace, &gc… in Execute()
150 …GemmMatmulPlus(0, 0, real_chunk, n, k, 1, mat_a, out_ch, mat_b, n, 0, mat_c, n, mat_workspace, &gc… in Execute()
Dconvolution_grad_filter.cc122 float *mat_b = nullptr; in Execute() local
142 mat_b = workspace_temp + task_id * ws_size_; in Execute()
144 RollingIm2ColPackDwUnitFp32(im, conv_param, mat_b, real_chunk, ci); in Execute()
148 …GemmMatmul(1, 0, k, n, real_chunk, 1, mat_a, out_ch, mat_b + (j * kernel_spatial), n * groups, 1, … in Execute()
160 mat_b = workspace_temp + task_id * ws_size_; in Execute()
163 RollingIm2ColPackUnitFp32(im, conv_param, mat_b, real_chunk, ci); in Execute()
164 … GemmMatmul(1, 0, k, n, real_chunk, 1, mat_a, out_ch, mat_b, n, 0, mat_tmp, n, mat_workspace); in Execute()
Ddeconvolution_grad_filter.cc112 float *mat_b = workspace_temp; in Execute() local
115 rolling_im2row_hwc(im, mat_b, conv_param, real_chunk, ci); in Execute()
116 …GemmMatmul(0, 0, n, m, real_chunk * in_w, 1, mat_b, real_chunk * in_w, mat_a, in_ch, 1, mat_c, in_… in Execute()
/third_party/mindspore/mindspore/lite/src/runtime/kernel/arm/fp16_grad/
Dconvolution_fp16_grad_input.cc125 float16_t *mat_b = nullptr; in DoExecute() local
127 mat_b = w_addr + j * nweights / groups; in DoExecute()
133 mat_b = gcb.mat_b; in DoExecute()
140 …GemmMatmulPlusFp16(0, 0, real_chunk, n, k, 1, mat_a, out_ch, mat_b, n, 0, mat_c, n, mat_workspace,… in DoExecute()
147 …GemmMatmulPlusFp16(0, 0, real_chunk, n, k, 1, mat_a, out_ch, mat_b, n, 0, mat_c, n, mat_workspace,… in DoExecute()
Dconvolution_fp16_grad_filter.cc135 float16_t *mat_b = workspace_temp + task_id * ws_size_; in DoExecute()
137 RollingIm2ColPackDwUnitFp16(im, conv_param, mat_b, real_chunk, ci); in DoExecute()
141 …GemmMatmulFp16(1, 0, k, n, real_chunk, 1, mat_a, out_ch, mat_b + (j * kernel_spatial), n * groups,… in DoExecute()
153 float16_t *mat_b = workspace_temp + task_id * ws_size_; in DoExecute() local
156 RollingIm2ColPackUnitFp16(im, conv_param, mat_b, real_chunk, ci); in DoExecute()
157 … GemmMatmulFp16(1, 0, k, n, real_chunk, 1, mat_a, out_ch, mat_b, n, 0, mat_tmp, n, mat_workspace); in DoExecute()
/third_party/boost/libs/qvm/test/
Dcmp_mm_test.cpp63 typedef boost::qvm::mat<scalar_b, 3, 3> mat_b; in test2() typedef
65 mat_b const b = { { {42, 94, 96}, {72, 95, 81}, {12, 84, 33} } }; in test2()
67 mat_b const d = { { {21, 47, 48}, {36, 47, 65}, {79, 27, 41} } }; in test2()