/external/XNNPACK/src/qu8-requantization/ |
D | gemmlowp-neon.c | 83 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qu8_requantize_gemmlowp__neon() local 87 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qu8_requantize_gemmlowp__neon() local
|
D | fp32-neon.c | 76 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_rounded), w_rounded), vzero_po… in xnn_qu8_requantize_fp32__neon() local 105 const int16x8_t zw_packed = vcombine_s16(vmovn_s32(z_biased), vmovn_s32(w_biased)); in xnn_qu8_requantize_fp32__neon() local
|
D | rndna-neon.c | 115 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qu8_requantize_rndna__neon() local 124 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qu8_requantize_rndna__neon() local
|
D | fp32-sse2.c | 75 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_rounded, w_rounded), vzero_point); in xnn_qu8_requantize_fp32__sse2() local
|
D | fp32-wasmsimd.c | 73 const v128_t zw_packed = wasm_v16x8_shuffle(z_biased, w_biased, 0, 2, 4, 6, 8, 10, 12, 14); in xnn_qu8_requantize_fp32__wasmsimd() local
|
/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/requantization/ |
D | q31-neon.c | 95 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_q31__neon() local 102 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_q31__neon() local
|
D | fp32-neon.c | 86 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_fp32__neon() local 134 const int16x8_t zw_packed = in pytorch_qnnp_requantize_fp32__neon() local
|
D | gemmlowp-neon.c | 94 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_gemmlowp__neon() local 101 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_gemmlowp__neon() local
|
D | precise-neon.c | 138 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_precise__neon() local 154 const int16x8_t zw_packed = vqaddq_s16( in pytorch_qnnp_requantize_precise__neon() local
|
D | fp32-sse2.c | 87 const __m128i zw_packed = in pytorch_qnnp_requantize_fp32__sse2() local
|
D | gemmlowp-ssse3.c | 64 const __m128i zw_packed = in pytorch_qnnp_requantize_gemmlowp__ssse3() local
|
D | gemmlowp-sse2.c | 64 const __m128i zw_packed = in pytorch_qnnp_requantize_gemmlowp__sse2() local
|
D | gemmlowp-sse4.c | 64 const __m128i zw_packed = in pytorch_qnnp_requantize_gemmlowp__sse4() local
|
D | fp32-psimd.c | 98 const psimd_u16 zw_packed = in pytorch_qnnp_requantize_fp32__psimd() local
|
D | precise-sse4.c | 107 const __m128i zw_packed = in pytorch_qnnp_requantize_precise__sse4() local
|
/external/XNNPACK/src/qs8-requantization/ |
D | gemmlowp-neon.c | 83 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_gemmlowp__neon() local 87 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_gemmlowp__neon() local
|
D | fp32-neon.c | 76 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_rounded), w_rounded), vzero_po… in xnn_qs8_requantize_fp32__neon() local 129 const int16x8_t zw_packed = vcombine_s16(vmovn_s32(z_biased), vmovn_s32(w_biased)); in xnn_qs8_requantize_fp32__neon() local
|
D | rndnu-neon-qdmulh.c | 75 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndnu__neon_qdmulh() local 79 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndnu__neon_qdmulh() local
|
D | rndnu-neon-mull.c | 87 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndnu__neon_mull() local 96 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndnu__neon_mull() local
|
D | rndna-neon.c | 115 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndna__neon() local 124 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndna__neon() local
|
D | fp32-sse4.c | 75 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_rounded, w_rounded), vzero_point); in xnn_qs8_requantize_fp32__sse4() local
|
D | fp32-sse2.c | 75 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_rounded, w_rounded), vzero_point); in xnn_qs8_requantize_fp32__sse2() local
|
D | fp32-wasmsimd.c | 73 const v128_t zw_packed = wasm_v16x8_shuffle(z_biased, w_biased, 0, 2, 4, 6, 8, 10, 12, 14); in xnn_qs8_requantize_fp32__wasmsimd() local
|
D | rndnu-sse4-srl.c | 82 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_scaled, w_scaled), vzero_point); in xnn_qs8_requantize_rndnu__sse4_srl() local
|
D | rndnu-sse4-sra.c | 84 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_scaled, w_scaled), vzero_point); in xnn_qs8_requantize_rndnu__sse4_sra() local
|