/external/XNNPACK/src/qs8-igemm/gen/ |
D | 3x16c8-minmax-neon-mull-padal.c | 355 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mull_padal() local 359 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mull_padal()
|
D | 3x16c16-minmax-neon-mlal-padal.c | 403 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_3x16c16__neon_mlal_padal() local 407 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_3x16c16__neon_mlal_padal()
|
D | 4x16c8-minmax-neon-mull-padal.c | 424 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mull_padal() local 428 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mull_padal()
|
D | 4x16c16-minmax-neon-mlal-padal.c | 488 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_4x16c16__neon_mlal_padal() local 492 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_4x16c16__neon_mlal_padal()
|
D | 3x16c8-minmax-neon-mlal-padal.c | 544 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal() local 548 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_3x16c8__neon_mlal_padal()
|
D | 4x16c8-minmax-neon-mlal-padal.c | 663 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal() local 667 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_igemm_minmax_ukernel_4x16c8__neon_mlal_padal()
|
/external/XNNPACK/src/qs8-gemm/gen/ |
D | 3x16c8-minmax-neon-mull-padal.c | 337 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mull_padal() local 341 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mull_padal()
|
D | 3x16c16-minmax-neon-mlal-padal.c | 385 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_3x16c16__neon_mlal_padal() local 389 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_3x16c16__neon_mlal_padal()
|
D | 4x16c8-minmax-neon-mull-padal.c | 404 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mull_padal() local 408 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mull_padal()
|
D | 3x16c8-minmax-neon-mlal-padal.c | 526 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal() local 530 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_3x16c8__neon_mlal_padal()
|
D | 4x16c16-minmax-neon-mlal-padal.c | 468 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_4x16c16__neon_mlal_padal() local 472 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_4x16c16__neon_mlal_padal()
|
D | 4x16c8-minmax-neon-mlal-padal.c | 643 const int32x2_t vpsum2x8 = vadd_s32(vget_low_s32(vacc2x8), vget_high_s32(vacc2x8)); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal() local 647 const int32x2_t vsum2x89 = vpadd_s32(vpsum2x8, vpsum2x9); in xnn_qs8_gemm_minmax_ukernel_4x16c8__neon_mlal_padal()
|