/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-scalar-imagic-c1.c | 51 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local 84 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local
|
D | 7p7x-minmax-fp32-scalar-lrintf-c1.c | 52 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local 85 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local
|
D | 7p7x-minmax-fp32-scalar-fmagic-c1.c | 51 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local 84 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local
|
/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-scalar-fmagic-c1.c | 51 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local 84 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_fmagic_c1() local
|
D | 7p7x-minmax-fp32-scalar-lrintf-c1.c | 52 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local 85 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_lrintf_c1() local
|
D | 7p7x-minmax-fp32-scalar-imagic-c1.c | 51 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local 84 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local 138 const int32_t vi4 = (int32_t) *i4++; in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__scalar_imagic_c1() local
|
/external/XNNPACK/src/f32-gavgpool/ |
D | 7p7x-minmax-wasmsimd-arm-c4.c | 47 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 86 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 147 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 180 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local
|
D | 7p7x-minmax-wasmsimd-x86-c4.c | 47 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 86 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 147 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 180 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local
|
D | 7p7x-minmax-sse-c4.c | 47 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 85 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 146 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 179 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local
|
D | 7p7x-minmax-neon-c4.c | 43 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 74 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 128 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 156 const float32x4_t vi4 = vld1q_f32(i4); in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local
|
/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gavgpool/ |
D | mp8x7p7q-neon.c | 50 const uint8x8_t vi4 = vld1_u8(i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 93 const uint8x8_t vi4 = vld1_u8(i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 172 const uint8x8_t vi4 = vld1_u8(i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 246 const uint8x8_t vi4 = in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local
|
D | mp8x7p7q-sse2.c | 52 const __m128i vi4 = _mm_loadl_epi64((const __m128i*)i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__sse2() local 106 const __m128i vi4 = _mm_loadl_epi64((const __m128i*)i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__sse2() local 182 const __m128i vi4 = _mm_loadl_epi64((const __m128i*)i4); in pytorch_q8gavgpool_ukernel_mp8x7p7q__sse2() local 258 const __m128i vi4 = in pytorch_q8gavgpool_ukernel_mp8x7p7q__sse2() local
|
/external/XNNPACK/src/f32-maxpool/ |
D | 9p8x-minmax-sse-c4.c | 86 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__sse_c4() local 119 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__sse_c4() local 202 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__sse_c4() local 230 const __m128 vi4 = _mm_loadu_ps(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__sse_c4() local
|
D | 9p8x-minmax-wasmsimd-arm-c4.c | 86 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 119 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 201 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 229 const v128_t vi4 = wasm_v128_load(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local
|
D | 9p8x-minmax-neon-c4.c | 82 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_maxpool_minmax_ukernel_9p8x__neon_c4() local 105 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_maxpool_minmax_ukernel_9p8x__neon_c4() local 178 const float32x4_t vi4 = vld1q_f32(i4); i4 += 4; in xnn_f32_maxpool_minmax_ukernel_9p8x__neon_c4() local 201 const float32x4_t vi4 = vld1q_f32(i4); in xnn_f32_maxpool_minmax_ukernel_9p8x__neon_c4() local
|
/external/XNNPACK/src/f16-maxpool/ |
D | 9p8x-minmax-neonfp16arith-c8.c | 82 const float16x8_t vi4 = vld1q_f16(i4); i4 += 8; in xnn_f16_maxpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 105 const float16x8_t vi4 = vld1q_f16(i4); i4 += 8; in xnn_f16_maxpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 182 const float16x8_t vi4 = vld1q_f16(i4); i4 += 8; in xnn_f16_maxpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 205 const float16x8_t vi4 = vld1q_f16(i4); in xnn_f16_maxpool_minmax_ukernel_9p8x__neonfp16arith_c8() local
|
D | 9p8x-minmax-f16c-c8.c | 87 const __m256 vi4 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) i4)); in xnn_f16_maxpool_minmax_ukernel_9p8x__f16c_c8() local 120 const __m256 vi4 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) i4)); in xnn_f16_maxpool_minmax_ukernel_9p8x__f16c_c8() local 209 const __m256 vi4 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) i4)); in xnn_f16_maxpool_minmax_ukernel_9p8x__f16c_c8() local 237 const __m256 vi4 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) i4)); in xnn_f16_maxpool_minmax_ukernel_9p8x__f16c_c8() local
|
/external/XNNPACK/src/s8-maxpool/ |
D | 9p8x-minmax-wasmsimd-c16.c | 87 const v128_t vi4 = wasm_v128_load(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__wasmsimd_c16() local 116 const v128_t vi4 = wasm_v128_load(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__wasmsimd_c16() local 206 const v128_t vi4 = wasm_v128_load(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__wasmsimd_c16() local 235 const v128_t vi4 = wasm_v128_load(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__wasmsimd_c16() local
|
D | 9p8x-minmax-sse2-c16.c | 89 const __m128i vi4 = _mm_xor_si128(_mm_loadu_si128((const __m128i*) i4), vbias); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 119 const __m128i vi4 = _mm_xor_si128(_mm_loadu_si128((const __m128i*) i4), vbias); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 209 const __m128i vi4 = _mm_xor_si128(_mm_loadu_si128((const __m128i*) i4), vbias); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 239 const __m128i vi4 = _mm_xor_si128(_mm_loadu_si128((const __m128i*) i4), vbias); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse2_c16() local
|
D | 9p8x-minmax-neon-c16.c | 82 const int8x16_t vi4 = vld1q_s8(i4); i4 += 16; in xnn_s8_maxpool_minmax_ukernel_9p8x__neon_c16() local 106 const int8x16_t vi4 = vld1q_s8(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__neon_c16() local 188 const int8x16_t vi4 = vld1q_s8(i4); i4 += 16; in xnn_s8_maxpool_minmax_ukernel_9p8x__neon_c16() local 212 const int8x16_t vi4 = vld1q_s8(i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__neon_c16() local
|
D | 9p8x-minmax-sse41-c16.c | 84 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); i4 += 16; in xnn_s8_maxpool_minmax_ukernel_9p8x__sse41_c16() local 108 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse41_c16() local 193 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); i4 += 16; in xnn_s8_maxpool_minmax_ukernel_9p8x__sse41_c16() local 218 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); in xnn_s8_maxpool_minmax_ukernel_9p8x__sse41_c16() local
|
/external/XNNPACK/src/u8-maxpool/ |
D | 9p8x-minmax-sse2-c16.c | 87 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); i4 += 16; in xnn_u8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 111 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); in xnn_u8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 196 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); i4 += 16; in xnn_u8_maxpool_minmax_ukernel_9p8x__sse2_c16() local 221 const __m128i vi4 = _mm_loadu_si128((const __m128i*) i4); in xnn_u8_maxpool_minmax_ukernel_9p8x__sse2_c16() local
|
D | 9p8x-minmax-neon-c16.c | 85 const uint8x16_t vi4 = vld1q_u8(i4); i4 += 16; in xnn_u8_maxpool_minmax_ukernel_9p8x__neon_c16() local 108 const uint8x16_t vi4 = vld1q_u8(i4); in xnn_u8_maxpool_minmax_ukernel_9p8x__neon_c16() local 189 const uint8x16_t vi4 = vld1q_u8(i4); i4 += 16; in xnn_u8_maxpool_minmax_ukernel_9p8x__neon_c16() local 212 const uint8x16_t vi4 = vld1q_u8(i4); in xnn_u8_maxpool_minmax_ukernel_9p8x__neon_c16() local
|
/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/u8maxpool/ |
D | 16x9p8q-neon.c | 77 const uint8x16_t vi4 = vld1q_u8(i4); in pytorch_u8maxpool_ukernel_16x9p8q__neon() local 121 const uint8x16_t vi4 = vld1q_u8(i4); in pytorch_u8maxpool_ukernel_16x9p8q__neon() local 185 const uint8x16_t vi4 = vld1q_u8(i4); in pytorch_u8maxpool_ukernel_16x9p8q__neon() local 227 const uint8x16_t vi4 = vld1q_u8(i4); in pytorch_u8maxpool_ukernel_16x9p8q__neon() local
|
D | 16x9p8q-sse2.c | 80 const __m128i vi4 = _mm_loadu_si128((const __m128i*)i4); in pytorch_u8maxpool_ukernel_16x9p8q__sse2() local 124 const __m128i vi4 = _mm_loadu_si128((const __m128i*)i4); in pytorch_u8maxpool_ukernel_16x9p8q__sse2() local 188 const __m128i vi4 = _mm_loadu_si128((const __m128i*)i4); in pytorch_u8maxpool_ukernel_16x9p8q__sse2() local 230 const __m128i vi4 = _mm_loadu_si128((const __m128i*)i4); in pytorch_u8maxpool_ukernel_16x9p8q__sse2() local
|