/external/XNNPACK/src/qs8-gemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 73 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 3x16c4s2-minmax-rndnu-neon-mull.c | 219 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local 256 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 79 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
D | 4x16c4-minmax-rndnu-neondot.c | 76 int32x4_t vacc2xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c4__neondot() local
|
D | 3x16c4-minmax-rndnu-neon-mull-ld1r.c | 296 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld1r() local 333 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld1r() local
|
D | 3x16c4-minmax-rndnu-neon-mull-ld2r.c | 293 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local 330 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local
|
D | 3x16c4-minmax-rndnu-neon-mull-dup.c | 293 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local 330 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local
|
/external/XNNPACK/src/qc8-gemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 72 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qc8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 78 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qc8_gemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
/external/XNNPACK/src/qu8-gemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 73 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qu8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 79 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
D | 3x16c4-minmax-rndnu-neondot.c | 176 int32x4_t vacc2xCDEF = vreinterpretq_s32_u32(vsubq_u32(vpacc2xCDEF, vnacc2x0123)); in xnn_qu8_gemm_minmax_rndnu_ukernel_3x16c4__neondot() local
|
/external/XNNPACK/src/qc8-igemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 69 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qc8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 73 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qc8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
/external/XNNPACK/src/qu8-igemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 70 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qu8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 74 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
D | 3x16c4-minmax-rndnu-neondot.c | 192 int32x4_t vacc2xCDEF = vreinterpretq_s32_u32(vsubq_u32(vpacc2xCDEF, vnacc2x0123)); in xnn_qu8_igemm_minmax_rndnu_ukernel_3x16c4__neondot() local
|
/external/XNNPACK/src/qs8-igemm/gen/ |
D | 3x16c8-minmax-fp32-avx512skx.c | 70 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qs8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 74 __m512i vacc2xCDEF = vacc0xCDEF; in xnn_qs8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
D | 3x16c4s2-minmax-rndnu-neon-mull.c | 237 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local 274 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local
|
D | 4x16c4-minmax-rndnu-neondot.c | 70 int32x4_t vacc2xCDEF = vacc0xCDEF; in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c4__neondot() local
|
D | 3x16c4-minmax-rndnu-neon-mull-ld2r.c | 310 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local 347 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local
|
D | 3x16c4-minmax-rndnu-neon-mull-dup.c | 310 int32x4_t vacc2xCDEF = vpaddq_s32(vacc2xCD, vacc2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local 347 int32x4_t vacc2xCDEF = vcombine_s32(vsum2xCD, vsum2xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local
|
/external/XNNPACK/src/f32-prelu/gen/ |
D | wasmsimd-minmax-4x16.c | 110 v128_t vacc2xCDEF = wasm_i32x4_max(vi2xCDEF, vzero); in xnn_f32_prelu_ukernel__wasmsimd_minmax_4x16() local
|
D | wasmsimd-bitselect-4x16.c | 109 v128_t vacc2xCDEF = wasm_f32x4_mul(vi2xCDEF, vwCDEF); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_4x16() local
|