/external/XNNPACK/src/qs8-gemm/gen/ |
D | 2x16c4s2-minmax-rndnu-neon-mull.c | 167 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local 192 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local
|
D | 2x16c8-minmax-fp32-avx512skx.c | 63 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 69 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 2x16c4-minmax-rndnu-neon-mull-dup.c | 222 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_dup() local 247 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_dup() local
|
D | 2x16c4-minmax-rndnu-neon-mull-ld2r.c | 222 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local 247 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local
|
D | 2x16c4-minmax-rndnu-neon-mull-ld1r.c | 224 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local 249 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local
|
D | 3x16c4s2-minmax-rndnu-neon-mull.c | 215 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local 244 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local
|
D | 4x16c8-minmax-fp32-avx512skx.c | 75 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qs8_gemm_minmax_fp32_ukernel_4x16c8__avx512skx() local
|
/external/XNNPACK/src/f32-prelu/gen/ |
D | wasmsimd-minmax-2x16.c | 80 v128_t vacc1xCDEF = wasm_i32x4_max(vi1xCDEF, vzero); in xnn_f32_prelu_ukernel__wasmsimd_minmax_2x16() local
|
D | wasmsimd-bitselect-2x16.c | 79 v128_t vacc1xCDEF = wasm_f32x4_mul(vi1xCDEF, vwCDEF); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_2x16() local
|
D | neon-2x16.c | 76 float32x4_t vacc1xCDEF = vmulq_f32(vi1xCDEF, vwCDEF); in xnn_f32_prelu_ukernel__neon_2x16() local
|
/external/XNNPACK/src/qu8-gemm/gen/ |
D | 2x16c8-minmax-fp32-avx512skx.c | 63 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qu8_gemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 69 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qu8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
/external/XNNPACK/src/qc8-gemm/gen/ |
D | 2x16c8-minmax-fp32-avx512skx.c | 62 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qc8_gemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 68 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qc8_gemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
/external/XNNPACK/src/qs8-igemm/gen/ |
D | 2x16c4s2-minmax-rndnu-neon-mull.c | 183 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local 208 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local
|
D | 2x16c8-minmax-fp32-avx512skx.c | 62 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qs8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 66 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qs8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
D | 2x16c4-minmax-rndnu-neon-mull-dup.c | 237 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_dup() local 262 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_dup() local
|
D | 2x16c4-minmax-rndnu-neon-mull-ld2r.c | 237 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local 262 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local
|
D | 2x16c4-minmax-rndnu-neon-mull-ld1r.c | 239 int32x4_t vacc1xCDEF = vpaddq_s32(vacc1xCD, vacc1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local 264 int32x4_t vacc1xCDEF = vcombine_s32(vsum1xCD, vsum1xEF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local
|
/external/XNNPACK/src/qu8-igemm/gen/ |
D | 2x16c8-minmax-fp32-avx512skx.c | 62 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qu8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 66 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qu8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|
/external/XNNPACK/src/qc8-igemm/gen/ |
D | 2x16c8-minmax-fp32-avx512skx.c | 61 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qc8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx() local
|
D | 3x16c8-minmax-fp32-avx512skx.c | 65 __m512i vacc1xCDEF = vacc0xCDEF; in xnn_qc8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx() local
|