Home
last modified time | relevance | path

Searched refs:vpsum0xD (Results 1 – 24 of 24) sorted by relevance

/external/XNNPACK/src/qs8-gemm/gen/
D1x16c8-minmax-rndnu-neon-mull.c156 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c8__neon_mull() local
159 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c8__neon_mull()
D1x16c16-minmax-rndnu-neon-mlal.c171 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c16__neon_mlal() local
174 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c16__neon_mlal()
D1x16c8-minmax-rndnu-neon-mlal.c245 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c8__neon_mlal() local
248 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x16c8__neon_mlal()
D2x16c8-minmax-rndnu-neon-mull.c223 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local
226 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mull()
D2x16c16-minmax-rndnu-neon-mlal.c254 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local
257 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c16__neon_mlal()
D3x16c8-minmax-rndnu-neon-mull.c290 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
293 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull()
D2x16c8-minmax-rndnu-neon-mlal.c362 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local
365 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mlal()
D3x16c16-minmax-rndnu-neon-mlal.c337 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
340 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal()
D4x16c8-minmax-rndnu-neon-mull.c357 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
360 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull()
D3x16c8-minmax-rndnu-neon-mlal.c479 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
482 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal()
D4x16c16-minmax-rndnu-neon-mlal.c420 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
423 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal()
D4x16c8-minmax-rndnu-neon-mlal.c596 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
599 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal()
/external/XNNPACK/src/qs8-igemm/gen/
D1x16c8-minmax-rndnu-neon-mull.c170 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c8__neon_mull() local
173 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c8__neon_mull()
D1x16c16-minmax-rndnu-neon-mlal.c185 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c16__neon_mlal() local
188 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c16__neon_mlal()
D1x16c8-minmax-rndnu-neon-mlal.c259 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c8__neon_mlal() local
262 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x16c8__neon_mlal()
D2x16c8-minmax-rndnu-neon-mull.c239 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local
242 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mull()
D2x16c16-minmax-rndnu-neon-mlal.c270 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local
273 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c16__neon_mlal()
D2x16c8-minmax-rndnu-neon-mlal.c378 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local
381 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mlal()
D3x16c8-minmax-rndnu-neon-mull.c308 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
311 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull()
D3x16c16-minmax-rndnu-neon-mlal.c355 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
358 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal()
D4x16c8-minmax-rndnu-neon-mull.c377 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
380 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull()
D3x16c8-minmax-rndnu-neon-mlal.c497 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
500 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal()
D4x16c16-minmax-rndnu-neon-mlal.c440 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
443 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal()
D4x16c8-minmax-rndnu-neon-mlal.c616 const int32x2_t vpsum0xD = vadd_s32(vget_low_s32(vacc0x13), vget_high_s32(vacc0x13)); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
619 const int32x2_t vsum0xCD = vpadd_s32(vpsum0xC, vpsum0xD); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal()