/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 98 const v128_t vaccGHIJ = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_low_u16x8(vaccGHIJKLMN)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 212 v128_t vaccGHIJ = wasm_v128_load(b + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 357 v128_t vaccGHIJ = wasm_v128_load(buffer + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 91 …const int32x4_t vaccGHIJ = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 184 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 307 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 100 __m128i vaccGHIJ = _mm_cvtepu16_epi32(vaccGHIJKLMN); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 225 __m128i vaccGHIJ = _mm_cvtepu16_epi32(vaccGHIJKLMN); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 370 __m128i vaccGHIJ = _mm_cvtepu16_epi32(vaccGHIJKLMN); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
D | 7p7x-minmax-rndnu-neon-c24.c | 90 …const int32x4_t vaccGHIJ = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 183 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 308 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-neon-c24.c | 90 …const int32x4_t vaccGHIJ = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 183 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 307 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c32.c | 111 const v128_t vaccGHIJ = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_low_u16x8(vaccGHIJKLMN)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 242 v128_t vaccGHIJ = wasm_v128_load(b + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 406 v128_t vaccGHIJ = wasm_v128_load(buffer + 16); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local
|
D | 7p7x-minmax-rndnu-neon-c32.c | 103 …const int32x4_t vaccGHIJ = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 212 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 356 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
|
/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-wasmsimd-c24.c | 98 const v128_t vaccGHIJ = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_low_i16x8(vaccGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 212 v128_t vaccGHIJ = wasm_v128_load(b + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local 357 v128_t vaccGHIJ = wasm_v128_load(buffer + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c24() local
|
D | 7p7x-minmax-fp32-sse41-c24.c | 99 __m128i vaccGHIJ = _mm_cvtepi16_epi32(vaccGHIJKLMN); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 223 __m128i vaccGHIJ = _mm_cvtepi16_epi32(vaccGHIJKLMN); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local 367 __m128i vaccGHIJ = _mm_cvtepi16_epi32(vaccGHIJKLMN); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c24() local
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 91 const int32x4_t vaccGHIJ = vaddw_s16(vinit_bias, vget_low_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 184 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 307 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
|
D | 7p7x-minmax-rndnu-neon-c24.c | 90 const int32x4_t vaccGHIJ = vaddw_s16(vinit_bias, vget_low_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 183 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 308 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-neon-c24.c | 90 const int32x4_t vaccGHIJ = vaddw_s16(vinit_bias, vget_low_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 183 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 307 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
|
D | 7p7x-minmax-fp32-wasmsimd-c32.c | 111 const v128_t vaccGHIJ = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_low_i16x8(vaccGHIJKLMN)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 242 v128_t vaccGHIJ = wasm_v128_load(b + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local 406 v128_t vaccGHIJ = wasm_v128_load(buffer + 16); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c32() local
|
D | 7p7x-minmax-rndnu-neon-c32.c | 103 const int32x4_t vaccGHIJ = vaddw_s16(vinit_bias, vget_low_s16(vsumGHIJKLMN)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 212 int32x4_t vaccGHIJ = vld1q_s32(b + 16); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 356 int32x4_t vaccGHIJ = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
|
/external/XNNPACK/src/qs8-vaddc/gen/ |
D | minmax-wasmsimd-x24.c | 43 …v128_t vaccGHIJ = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_low_i16x8(vaGHIJKLMN), va… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x24() local
|
D | minmax-avx-mul32-ld32-x24.c | 49 __m128i vaccGHIJ = _mm_add_epi32(vbias, _mm_mullo_epi32(vaGHIJ, va_multiplier)); in xnn_qs8_vaddc_minmax_ukernel__avx_mul32_ld32_x24() local
|
D | minmax-sse41-mul32-ld32-x24.c | 49 __m128i vaccGHIJ = _mm_add_epi32(vbias, _mm_mullo_epi32(vaGHIJ, va_multiplier)); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x24() local
|
D | minmax-xop-mul32-ld32-x24.c | 54 __m128i vaccGHIJ = _mm_macc_epi32(vaGHIJ, va_multiplier, vbias); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x24() local
|
D | minmax-wasmsimd-x32.c | 44 …v128_t vaccGHIJ = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_low_i16x8(vaGHIJKLMN), va… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32() local
|
D | minmax-neon-ld64-x24.c | 48 int32x4_t vaccGHIJ = vmlaq_s32(vbias, vmovl_s16(vget_low_s16(vxaGHIJKLMN)), va_multiplier); in xnn_qs8_vaddc_minmax_ukernel__neon_ld64_x24() local
|
/external/XNNPACK/src/qu8-vaddc/gen/ |
D | minmax-wasmsimd-x32.c | 44 …v128_t vaccGHIJ = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_u32x4_extend_low_u16x8(vaGHIJKLMN), va… in xnn_qu8_vaddc_minmax_ukernel__wasmsimd_x32() local
|
/external/XNNPACK/src/qs8-vadd/gen/ |
D | minmax-wasmsimd-x24.c | 46 …v128_t vaccGHIJ = wasm_i32x4_add(vbias, wasm_i32x4_mul(wasm_i32x4_extend_low_i16x8(vaGHIJKLMN), va… in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x24() local
|
/external/XNNPACK/src/f32-qs8-vcvt/gen/ |
D | vcvt-neonv8-x24.c | 53 const int32x4_t vaccGHIJ = vcvtnq_s32_f32(vxGHIJ); in xnn_f32_qs8_vcvt_ukernel__neonv8_x24() local
|
/external/XNNPACK/src/f32-qu8-vcvt/gen/ |
D | vcvt-neonv8-x24.c | 53 const int32x4_t vaccGHIJ = vcvtnq_s32_f32(vxGHIJ); in xnn_f32_qu8_vcvt_ukernel__neonv8_x24() local
|
D | vcvt-wasmsimd-cvt-x24.c | 61 v128_t vaccGHIJ = wasm_i32x4_trunc_sat_f32x4(vxGHIJ); in xnn_f32_qu8_vcvt_ukernel__wasmsimd_cvt_x24() local
|