Home
last modified time | relevance | path

Searched refs:vprod0x9 (Results 1 – 24 of 24) sorted by relevance

/external/XNNPACK/src/qs8-igemm/gen/
D1x16c8-minmax-neon-mlal-padal.c132 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
133 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
134 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
195 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
196 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
D1x16c16-minmax-neon-mlal-padal.c121 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_1x16c16__neon_mlal_padal() local
122 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_1x16c16__neon_mlal_padal()
123 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_1x16c16__neon_mlal_padal()
D2x16c8-minmax-neon-mlal-padal.c185 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mlal_padal() local
187 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mlal_padal()
189 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mlal_padal()
288 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mlal_padal() local
290 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mlal_padal()
D2x16c16-minmax-neon-mlal-padal.c173 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_2x16c16__neon_mlal_padal() local
175 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_2x16c16__neon_mlal_padal()
177 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_2x16c16__neon_mlal_padal()
D3x16c8-minmax-neon-mlal-padal.c238 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal() local
241 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal()
244 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal()
381 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal() local
384 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal()
D1x16c8-minmax-neon-mull-padal.c106 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mull_padal() local
107 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mull_padal()
D3x16c16-minmax-neon-mlal-padal.c225 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_3x16c16__neon_mlal_padal() local
228 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_3x16c16__neon_mlal_padal()
231 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_3x16c16__neon_mlal_padal()
D4x16c8-minmax-neon-mlal-padal.c291 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal() local
295 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal()
299 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal()
474 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal() local
478 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal()
D2x16c8-minmax-neon-mull-padal.c149 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mull_padal() local
151 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_2x16c8__neon_mull_padal()
D4x16c16-minmax-neon-mlal-padal.c277 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_4x16c16__neon_mlal_padal() local
281 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_4x16c16__neon_mlal_padal()
285 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_4x16c16__neon_mlal_padal()
D3x16c8-minmax-neon-mull-padal.c192 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mull_padal() local
195 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mull_padal()
D4x16c8-minmax-neon-mull-padal.c235 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mull_padal() local
239 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mull_padal()
/external/XNNPACK/src/qs8-gemm/gen/
D1x16c8-minmax-neon-mlal-padal.c121 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
122 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
123 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
184 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
185 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
D1x16c16-minmax-neon-mlal-padal.c110 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_1x16c16__neon_mlal_padal() local
111 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_1x16c16__neon_mlal_padal()
112 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_1x16c16__neon_mlal_padal()
D2x16c8-minmax-neon-mlal-padal.c172 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mlal_padal() local
174 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mlal_padal()
176 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mlal_padal()
275 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mlal_padal() local
277 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mlal_padal()
D2x16c16-minmax-neon-mlal-padal.c160 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_2x16c16__neon_mlal_padal() local
162 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_2x16c16__neon_mlal_padal()
164 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_2x16c16__neon_mlal_padal()
D3x16c8-minmax-neon-mlal-padal.c223 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal() local
226 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal()
229 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal()
366 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal() local
369 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal()
D1x16c8-minmax-neon-mull-padal.c95 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mull_padal() local
96 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mull_padal()
D3x16c16-minmax-neon-mlal-padal.c210 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_3x16c16__neon_mlal_padal() local
213 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_3x16c16__neon_mlal_padal()
216 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_3x16c16__neon_mlal_padal()
D4x16c8-minmax-neon-mlal-padal.c274 int16x8_t vprod0x9 = vmull_s8(vb9x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal() local
278 vprod0x9 = vmlal_s8(vprod0x9, vb9x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal()
282 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal()
457 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal() local
461 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal()
D2x16c8-minmax-neon-mull-padal.c136 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mull_padal() local
138 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_2x16c8__neon_mull_padal()
D4x16c16-minmax-neon-mlal-padal.c260 int16x8_t vprod0x9 = vmull_s8(vget_low_s8(vb9), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_4x16c16__neon_mlal_padal() local
264 vprod0x9 = vmlal_s8(vprod0x9, vget_high_s8(vb9), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_4x16c16__neon_mlal_padal()
268 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_4x16c16__neon_mlal_padal()
D3x16c8-minmax-neon-mull-padal.c177 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mull_padal() local
180 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mull_padal()
D4x16c8-minmax-neon-mull-padal.c218 const int16x8_t vprod0x9 = vmull_s8(vb9, va0); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mull_padal() local
222 vacc0x9 = vpadalq_s16(vacc0x9, vprod0x9); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mull_padal()