/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-wasmsimd-c16.c | 83 const v128_t vacc89AB = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_low_i16x8(vacc89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local 144 v128_t vacc89AB = wasm_v128_load(b + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local 231 v128_t vacc89AB = wasm_v128_load(buffer + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local
|
D | 7p7x-minmax-rndnu-neon-c16.c | 75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 125 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 203 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
|
D | 7p7x-minmax-fp32-sse41-c16.c | 84 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local 150 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local 236 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local
|
D | 7p7x-minmax-fp32-neonv8-c16.c | 76 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 126 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 202 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
|
D | 7p7x-minmax-fp32-neon-c16.c | 75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 125 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 202 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 97 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 221 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 365 __m128i vacc89AB = _mm_cvtepi16_epi32(vacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
D | 7p7x-minmax-fp32-sse2-c16.c | 106 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vsgnacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local 194 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vsgnacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local 302 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vsgnacc89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local
|
D | 7p7x-minmax-rndnu-neon-c24.c | 88 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 180 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 305 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 89 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 181 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 304 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 96 const v128_t vacc89AB = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_low_i16x8(vacc89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 210 v128_t vacc89AB = wasm_v128_load(b + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 355 v128_t vacc89AB = wasm_v128_load(buffer + 8); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-wasmsimd-c16.c | 83 const v128_t vacc89AB = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_low_u16x8(vacc89ABCDEF)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local 144 v128_t vacc89AB = wasm_v128_load(b + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local 231 v128_t vacc89AB = wasm_v128_load(buffer + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c16() local
|
D | 7p7x-minmax-fp32-sse41-c16.c | 85 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local 152 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local 239 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c16() local
|
D | 7p7x-minmax-rndnu-neon-c16.c | 75 …const int32x4_t vacc89AB = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 125 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 203 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
|
D | 7p7x-minmax-fp32-neonv8-c16.c | 76 …const int32x4_t vacc89AB = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 126 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 202 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
|
D | 7p7x-minmax-fp32-neon-c16.c | 75 …const int32x4_t vacc89AB = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 125 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 202 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
|
D | 7p7x-minmax-rndnu-neon-c24.c | 88 …const int32x4_t vacc89AB = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 180 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 305 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 96 const v128_t vacc89AB = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_low_u16x8(vacc89ABCDEF)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 210 v128_t vacc89AB = wasm_v128_load(b + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 355 v128_t vacc89AB = wasm_v128_load(buffer + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
D | 7p7x-minmax-fp32-sse2-c16.c | 105 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local 191 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local 297 __m128i vacc89AB = _mm_unpacklo_epi16(vacc89ABCDEF, vzero); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse2_c16() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 89 …const int32x4_t vacc89AB = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 181 int32x4_t vacc89AB = vld1q_s32(b + 8); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 304 int32x4_t vacc89AB = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 98 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 223 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 368 __m128i vacc89AB = _mm_cvtepu16_epi32(vacc89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
/external/XNNPACK/src/f32-vrelu/gen/ |
D | vrelu-wasmsimd-x16.c | 34 v128_t vacc89AB = wasm_v128_load(x + 8); in xnn_f32_vrelu_ukernel__wasmsimd_x16() local
|
/external/XNNPACK/src/f32-vhswish/gen/ |
D | vhswish-wasmsimd-x16.c | 43 v128_t vacc89AB = wasm_f32x4_add(vx89AB, vthree); in xnn_f32_vhswish_ukernel__wasmsimd_x16() local
|
D | vhswish-neon-x16.c | 42 float32x4_t vacc89AB = vaddq_f32(vx89AB, vthree); in xnn_f32_vhswish_ukernel__neon_x16() local
|
/external/XNNPACK/src/qu8-vaddc/gen/ |
D | minmax-wasmsimd-x16.c | 40 …v128_t vacc89AB = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_u32x4_extend_low_u16x8(va89ABCDEF), va… in xnn_qu8_vaddc_minmax_ukernel__wasmsimd_x16() local
|
/external/XNNPACK/src/qs8-vaddc/gen/ |
D | minmax-wasmsimd-x16.c | 40 …v128_t vacc89AB = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_low_i16x8(va89ABCDEF), va… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x16() local
|