Home
last modified time | relevance | path

Searched refs:z_scaled (Results 1 – 25 of 42) sorted by relevance

12

/external/XNNPACK/src/qs8-requantization/
Drndnu-neon-mull.c83 …const int32x4_t z_scaled = vuzp1q_s32(vreinterpretq_s32_s64(z01_scaled), vreinterpretq_s32_s64(z23… in xnn_qs8_requantize_rndnu__neon_mull() local
87 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndnu__neon_mull()
92 const int32x4_t z_scaled = vcombine_s32(vmovn_s64(z01_scaled), vmovn_s64(z23_scaled)); in xnn_qs8_requantize_rndnu__neon_mull() local
96 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndnu__neon_mull()
Drndnu-neon-qdmulh.c70 const int32x4_t z_scaled = vrshlq_s32(z_product, vpost_shift); in xnn_qs8_requantize_rndnu__neon_qdmulh() local
75 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndnu__neon_qdmulh()
79 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndnu__neon_qdmulh()
Dgemmlowp-neon.c78 const int32x4_t z_scaled = vrshlq_s32(z_adjusted_product, vshift); in xnn_qs8_requantize_gemmlowp__neon() local
83 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_gemmlowp__neon()
87 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_gemmlowp__neon()
Dfp32-neon.c58 const float32x4_t z_scaled = vmulq_f32(vcvtq_f32_s32(z), vscale); in xnn_qs8_requantize_fp32__neon() local
67 const int32x4_t z_rounded = vcvtnq_s32_f32(z_scaled); in xnn_qs8_requantize_fp32__neon()
116 const float32x4_t z_clamped = vminq_f32(vmaxq_f32(z_scaled, vfmin), vfmax); in xnn_qs8_requantize_fp32__neon()
Drndna-neon.c111 …const int32x4_t z_scaled = vuzp1q_s32(vreinterpretq_s32_s64(z01_scaled), vreinterpretq_s32_s64(z23… in xnn_qs8_requantize_rndna__neon() local
115 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qs8_requantize_rndna__neon()
120 const int32x4_t z_scaled = vcombine_s32(vmovn_s64(z01_scaled), vmovn_s64(z23_scaled)); in xnn_qs8_requantize_rndna__neon() local
124 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qs8_requantize_rndna__neon()
Dfp32-scalar-fmagic.c44 const float z_scaled = (float) z * scale; in xnn_qs8_requantize_fp32__scalar_fmagic() local
49 const float z_clamped = math_min_f32(math_max_f32(z_scaled, fmin), fmax); in xnn_qs8_requantize_fp32__scalar_fmagic()
Dfp32-sse4.c50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qs8_requantize_fp32__sse4() local
66 const __m128i z_rounded = _mm_cvtps_epi32(z_scaled); in xnn_qs8_requantize_fp32__sse4()
Dfp32-scalar-lrintf.c42 const float z_scaled = (float) z * scale; in xnn_qs8_requantize_fp32__scalar_lrintf() local
47 const float z_clamped = math_min_f32(math_max_f32(z_scaled, fmin), fmax); in xnn_qs8_requantize_fp32__scalar_lrintf()
Dfp32-sse2.c50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qs8_requantize_fp32__sse2() local
66 const __m128i z_rounded = _mm_cvtps_epi32(z_scaled); in xnn_qs8_requantize_fp32__sse2()
Dfp32-wasmsimd.c48 const v128_t z_scaled = wasm_f32x4_mul(wasm_f32x4_convert_i32x4(z), vscale); in xnn_qs8_requantize_fp32__wasmsimd() local
60 const v128_t z_clamped = wasm_f32x4_min(wasm_f32x4_max(z_scaled, vfmin), vfmax); in xnn_qs8_requantize_fp32__wasmsimd()
Drndnu-scalar.c62 const int32_t z_scaled = (int32_t) math_asr_s64(z_product + rounding, shift); in xnn_qs8_requantize_rndnu__scalar() local
68 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qs8_requantize_rndnu__scalar()
Drndna-scalar-signed64.c68 const int32_t z_scaled = (int32_t) math_asr_s64(z_adjusted_product + rounding, shift); in xnn_qs8_requantize_rndna__scalar_signed64() local
74 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qs8_requantize_rndna__scalar_signed64()
Drndna-scalar-unsigned64.c75 const int32_t z_scaled = (int32_t) (z >= 0 ? z_abs_scaled : -z_abs_scaled); in xnn_qs8_requantize_rndna__scalar_unsigned64() local
81 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qs8_requantize_rndna__scalar_unsigned64()
Dgemmlowp-scalar.c103 … const int32_t z_scaled = math_asr_s32(z_q31product, shift) + (int32_t) (z_remainder > threshold); in xnn_qs8_requantize_gemmlowp__scalar() local
109 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qs8_requantize_gemmlowp__scalar()
Drndnu-sse4-sra.c80 const __m128i z_scaled = _mm_sra_epi32(z_prescaled, vshift); in xnn_qs8_requantize_rndnu__sse4_sra() local
84 const __m128i zw_packed = _mm_adds_epi16(_mm_packs_epi32(z_scaled, w_scaled), vzero_point); in xnn_qs8_requantize_rndnu__sse4_sra()
/external/XNNPACK/src/qu8-requantization/
Dgemmlowp-neon.c78 const int32x4_t z_scaled = vrshlq_s32(z_adjusted_product, vshift); in xnn_qu8_requantize_gemmlowp__neon() local
83 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qu8_requantize_gemmlowp__neon()
87 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qu8_requantize_gemmlowp__neon()
Dfp32-neon.c58 const float32x4_t z_scaled = vmulq_f32(vcvtq_f32_s32(z), vscale); in xnn_qu8_requantize_fp32__neon() local
67 const int32x4_t z_rounded = vcvtnq_s32_f32(z_scaled); in xnn_qu8_requantize_fp32__neon()
92 const float32x4_t z_clamped = vminq_f32(vmaxq_f32(z_scaled, vfmin), vfmax); in xnn_qu8_requantize_fp32__neon()
Drndna-neon.c111 …const int32x4_t z_scaled = vuzp1q_s32(vreinterpretq_s32_s64(z01_scaled), vreinterpretq_s32_s64(z23… in xnn_qu8_requantize_rndna__neon() local
115 …const int16x8_t zw_packed = vqaddq_s16(vqmovn_high_s32(vqmovn_s32(z_scaled), w_scaled), vzero_poin… in xnn_qu8_requantize_rndna__neon()
120 const int32x4_t z_scaled = vcombine_s32(vmovn_s64(z01_scaled), vmovn_s64(z23_scaled)); in xnn_qu8_requantize_rndna__neon() local
124 …const int16x8_t zw_packed = vqaddq_s16(vcombine_s16(vqmovn_s32(z_scaled), vqmovn_s32(w_scaled)), v… in xnn_qu8_requantize_rndna__neon()
Dfp32-sse2.c50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qu8_requantize_fp32__sse2() local
66 const __m128i z_rounded = _mm_cvtps_epi32(z_scaled); in xnn_qu8_requantize_fp32__sse2()
Dfp32-scalar-fmagic.c44 const float z_scaled = (float) z * scale; in xnn_qu8_requantize_fp32__scalar_fmagic() local
49 const float z_clamped = math_min_f32(math_max_f32(z_scaled, fmin), fmax); in xnn_qu8_requantize_fp32__scalar_fmagic()
Dfp32-scalar-lrintf.c42 const float z_scaled = (float) z * scale; in xnn_qu8_requantize_fp32__scalar_lrintf() local
47 const float z_clamped = math_min_f32(math_max_f32(z_scaled, fmin), fmax); in xnn_qu8_requantize_fp32__scalar_lrintf()
Dfp32-wasmsimd.c48 const v128_t z_scaled = wasm_f32x4_mul(wasm_f32x4_convert_i32x4(z), vscale); in xnn_qu8_requantize_fp32__wasmsimd() local
60 const v128_t z_clamped = wasm_f32x4_min(wasm_f32x4_max(z_scaled, vfmin), vfmax); in xnn_qu8_requantize_fp32__wasmsimd()
Drndna-scalar-signed64.c68 const int32_t z_scaled = (int32_t) math_asr_s64(z_adjusted_product + rounding, shift); in xnn_qu8_requantize_rndna__scalar_signed64() local
74 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qu8_requantize_rndna__scalar_signed64()
Drndna-scalar-unsigned64.c75 const int32_t z_scaled = (int32_t) (z >= 0 ? z_abs_scaled : -z_abs_scaled); in xnn_qu8_requantize_rndna__scalar_unsigned64() local
81 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qu8_requantize_rndna__scalar_unsigned64()
Dgemmlowp-scalar.c103 … const int32_t z_scaled = math_asr_s32(z_q31product, shift) + (int32_t) (z_remainder > threshold); in xnn_qu8_requantize_gemmlowp__scalar() local
109 const int32_t z_clamped = math_min_s32(math_max_s32(z_scaled, smin), smax); in xnn_qu8_requantize_gemmlowp__scalar()

12