/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-rndnu-neon-c24.c | 91 …const int32x4_t vaccKLMN = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 184 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 309 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 100 __m128i vaccKLMN = _mm_unpackhi_epi16(vaccGHIJKLMN, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 225 __m128i vaccKLMN = _mm_unpackhi_epi16(vaccGHIJKLMN, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 370 __m128i vaccKLMN = _mm_unpackhi_epi16(vaccGHIJKLMN, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 92 …const int32x4_t vaccKLMN = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 185 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 308 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 99 const v128_t vaccKLMN = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_high_u16x8(vaccGHIJKLMN)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 213 v128_t vaccKLMN = wasm_v128_load(b + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 358 v128_t vaccKLMN = wasm_v128_load(buffer + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
D | 7p7x-minmax-fp32-neon-c24.c | 91 …const int32x4_t vaccKLMN = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 184 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 308 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c32.c | 112 const v128_t vaccKLMN = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_high_u16x8(vaccGHIJKLMN)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 243 v128_t vaccKLMN = wasm_v128_load(b + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 407 v128_t vaccKLMN = wasm_v128_load(buffer + 20); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local
|
D | 7p7x-minmax-rndnu-neon-c32.c | 104 …const int32x4_t vaccKLMN = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 213 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 357 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
|
/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 99 const v128_t vaccKLMN = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_high_i16x8(vaccGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 213 v128_t vaccKLMN = wasm_v128_load(b + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 358 v128_t vaccKLMN = wasm_v128_load(buffer + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 99 __m128i vaccKLMN = _mm_srai_epi32(_mm_unpackhi_epi16(vaccGHIJKLMN, vaccGHIJKLMN), 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 223 __m128i vaccKLMN = _mm_srai_epi32(_mm_unpackhi_epi16(vaccGHIJKLMN, vaccGHIJKLMN), 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 367 __m128i vaccKLMN = _mm_srai_epi32(_mm_unpackhi_epi16(vaccGHIJKLMN, vaccGHIJKLMN), 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 92 const int32x4_t vaccKLMN = vaddw_s16(vinit_bias, vget_high_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 185 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 308 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-rndnu-neon-c24.c | 91 const int32x4_t vaccKLMN = vaddw_s16(vinit_bias, vget_high_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 184 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 309 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-neon-c24.c | 91 const int32x4_t vaccKLMN = vaddw_s16(vinit_bias, vget_high_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 184 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 308 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c32.c | 112 const v128_t vaccKLMN = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_high_i16x8(vaccGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 243 v128_t vaccKLMN = wasm_v128_load(b + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 407 v128_t vaccKLMN = wasm_v128_load(buffer + 20); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local
|
D | 7p7x-minmax-rndnu-neon-c32.c | 104 const int32x4_t vaccKLMN = vaddw_s16(vinit_bias, vget_high_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 213 int32x4_t vaccKLMN = vld1q_s32(b + 20); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 357 int32x4_t vaccKLMN = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
|
/external/XNNPACK/src/qs8-vaddc/gen/ |
D | minmax-wasmsimd-x24.c | 44 …v128_t vaccKLMN = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_high_i16x8(vaGHIJKLMN), v… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x24() local
|
D | minmax-xop-mul32-ld32-x24.c | 54 __m128i vaccKLMN = _mm_macc_epi32(vaKLMN, va_multiplier, vbias); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x24() local
|
D | minmax-sse41-mul32-ld32-x24.c | 49 __m128i vaccKLMN = _mm_add_epi32(vbias, _mm_mullo_epi32(vaKLMN, va_multiplier)); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x24() local
|
D | minmax-avx-mul32-ld32-x24.c | 49 __m128i vaccKLMN = _mm_add_epi32(vbias, _mm_mullo_epi32(vaKLMN, va_multiplier)); in xnn_qs8_vaddc_minmax_ukernel__avx_mul32_ld32_x24() local
|
D | minmax-wasmsimd-x32.c | 45 …v128_t vaccKLMN = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_high_i16x8(vaGHIJKLMN), v… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32() local
|
D | minmax-neon-ld64-x24.c | 49 int32x4_t vaccKLMN = vmlaq_s32(vbias, vmovl_s16(vget_high_s16(vxaGHIJKLMN)), va_multiplier); in xnn_qs8_vaddc_minmax_ukernel__neon_ld64_x24() local
|
/external/XNNPACK/src/qu8-vaddc/gen/ |
D | minmax-wasmsimd-x32.c | 45 …v128_t vaccKLMN = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_u32x4_extend_high_u16x8(vaGHIJKLMN), v… in xnn_qu8_vaddc_minmax_ukernel__wasmsimd_x32() local
|
/external/XNNPACK/src/qs8-vadd/gen/ |
D | minmax-wasmsimd-x24.c | 47 …v128_t vaccKLMN = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_high_i16x8(vaGHIJKLMN), v… in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x24() local
|
/external/XNNPACK/src/f32-qu8-vcvt/gen/ |
D | vcvt-neonv8-x24.c | 54 const int32x4_t vaccKLMN = vcvtnq_s32_f32(vxKLMN); in xnn_f32_qu8_vcvt_ukernel__neonv8_x24() local
|
D | vcvt-avx512skx-x96.c | 64 const __m512i vaccKLMN = _mm512_cvtps_epi32(vxKLMN); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x96() local
|
/external/XNNPACK/src/f32-qs8-vcvt/gen/ |
D | vcvt-neonv8-x24.c | 54 const int32x4_t vaccKLMN = vcvtnq_s32_f32(vxKLMN); in xnn_f32_qs8_vcvt_ukernel__neonv8_x24() local
|