/external/XNNPACK/src/f32-vhswish/gen/ |
D | vhswish-sse-x8.c | 37 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); in xnn_f32_vhswish_ukernel__sse_x8() local 59 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); in xnn_f32_vhswish_ukernel__sse_x8() local 69 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); in xnn_f32_vhswish_ukernel__sse_x8() local
|
D | vhswish-sse-x4.c | 36 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); in xnn_f32_vhswish_ukernel__sse_x4() local 51 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); in xnn_f32_vhswish_ukernel__sse_x4() local
|
/external/XNNPACK/src/f32-qs8-vcvt/gen/ |
D | vcvt-avx512skx-x32.c | 46 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x32() local 68 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x32() local 91 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x32() local
|
D | vcvt-avx512skx-x64.c | 52 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x64() local 78 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x64() local 101 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x64() local
|
D | vcvt-avx512skx-x96.c | 59 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x96() local 93 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x96() local 116 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x96() local
|
D | vcvt-avx512skx-x128.c | 64 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x128() local 102 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x128() local 125 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qs8_vcvt_ukernel__avx512skx_x128() local
|
/external/XNNPACK/src/f32-qu8-vcvt/gen/ |
D | vcvt-avx512skx-x32.c | 46 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x32() local 68 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x32() local 91 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x32() local
|
D | vcvt-avx512skx-x64.c | 52 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x64() local 78 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x64() local 101 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x64() local
|
D | vcvt-avx512skx-x96.c | 59 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x96() local 93 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x96() local 116 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x96() local
|
D | vcvt-avx512skx-x128.c | 64 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x128() local 102 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x128() local 125 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); in xnn_f32_qu8_vcvt_ukernel__avx512skx_x128() local
|
/external/XNNPACK/src/f32-vhswish/ |
D | sse.c.in | 61 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); variable 71 __m128 vacc0123 = _mm_mul_ps(vx0123, vsixth); variable
|
/external/XNNPACK/src/f32-qs8-vcvt/ |
D | avx512skx.c.in | 107 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); variable 133 const __m512i vacc0123 = _mm512_cvtps_epi32(vx0123); variable
|
/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-rndnu-neon-c8.c | 60 …const int32x4_t vacc0123 = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 93 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 152 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 203 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local
|
D | 7p7x-minmax-fp32-wasmsimd-c8.c | 68 const v128_t vacc0123 = wasm_i32x4_add(vinit_bias, wasm_u32x4_extend_low_u16x8(vacc01234567)); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 112 v128_t vacc0123 = wasm_v128_load(b); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 180 v128_t vacc0123 = wasm_v128_load(buffer); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 237 v128_t vacc0123 = wasm_v128_load(buffer); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local
|
D | 7p7x-minmax-fp32-neonv8-c8.c | 61 …const int32x4_t vacc0123 = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 94 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 151 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 202 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local
|
D | 7p7x-minmax-fp32-sse41-c8.c | 70 __m128i vacc0123 = _mm_cvtepu16_epi32(vacc01234567); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 118 __m128i vacc0123 = _mm_cvtepu16_epi32(vacc01234567); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 186 __m128i vacc0123 = _mm_cvtepu16_epi32(vacc01234567); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 240 __m128i vacc0123 = _mm_cvtepu16_epi32(vacc01234567); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local
|
D | 7p7x-minmax-fp32-neon-c8.c | 60 …const int32x4_t vacc0123 = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget… in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 93 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 151 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 204 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local
|
/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-sse41-c8.c | 69 __m128i vacc0123 = _mm_cvtepi16_epi32(vacc01234567); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 116 __m128i vacc0123 = _mm_cvtepi16_epi32(vacc01234567); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 183 __m128i vacc0123 = _mm_cvtepi16_epi32(vacc01234567); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local 237 __m128i vacc0123 = _mm_cvtepi16_epi32(vacc01234567); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__sse41_c8() local
|
D | 7p7x-minmax-fp32-wasmsimd-c8.c | 68 const v128_t vacc0123 = wasm_i32x4_add(vinit_bias, wasm_i32x4_extend_low_i16x8(vacc01234567)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 112 v128_t vacc0123 = wasm_v128_load(b); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 180 v128_t vacc0123 = wasm_v128_load(buffer); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local 237 v128_t vacc0123 = wasm_v128_load(buffer); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__wasmsimd_c8() local
|
D | 7p7x-minmax-rndnu-neon-c8.c | 60 const int32x4_t vacc0123 = vaddw_s16(vinit_bias, vget_low_s16(vsum01234567)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 93 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 152 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local 203 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c8() local
|
D | 7p7x-minmax-fp32-neon-c8.c | 60 const int32x4_t vacc0123 = vaddw_s16(vinit_bias, vget_low_s16(vsum01234567)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 93 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 151 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local 204 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c8() local
|
D | 7p7x-minmax-fp32-neonv8-c8.c | 61 const int32x4_t vacc0123 = vaddw_s16(vinit_bias, vget_low_s16(vsum01234567)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 94 int32x4_t vacc0123 = vld1q_s32(b); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 151 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local 202 int32x4_t vacc0123 = vld1q_s32(buffer); buffer += 4; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c8() local
|
/external/XNNPACK/src/f32-dwconv/gen/ |
D | up8x3-wasmrelaxedsimd-fma.c | 87 const v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmrelaxedsimd_fma() local 118 const v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmrelaxedsimd_fma() local 139 v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmrelaxedsimd_fma() local
|
D | up8x3-wasmsimd.c | 87 const v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmsimd() local 118 const v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmsimd() local 139 v128_t vacc0123 = vacc0123p0; in xnn_f32_dwconv_ukernel_up8x3__wasmsimd() local
|
D | up8x3-minmax-sse.c | 89 __m128 vacc0123 = _mm_max_ps(vacc0123p0, vmin); in xnn_f32_dwconv_minmax_ukernel_up8x3__sse() local 122 __m128 vacc0123 = _mm_max_ps(vacc0123p0, vmin); in xnn_f32_dwconv_minmax_ukernel_up8x3__sse() local 144 __m128 vacc0123 = _mm_max_ps(vacc0123p0, vmin); in xnn_f32_dwconv_minmax_ukernel_up8x3__sse() local
|