/external/XNNPACK/src/f32-avgpool/ |
D | 9p8x-minmax-sse-c4.c | 106 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 109 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() 182 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 185 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() 281 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 284 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() 310 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 313 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4()
|
D | 9p8x-minmax-wasmsimd-arm-c4.c | 106 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 109 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 183 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 186 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 283 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 286 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 312 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 315 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4()
|
D | 9p8x-minmax-wasmsimd-x86-c4.c | 106 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 109 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 183 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 186 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 283 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 286 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 312 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 315 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4()
|
D | 9p8x-minmax-neon-c4.c | 97 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 100 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() 165 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 168 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() 256 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 259 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() 284 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 287 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4()
|
D | 9p8x-minmax-scalar-c1.c | 97 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1() local 100 const float vsum01678 = vsum018 + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1() 166 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1() local 169 const float vsum0167a = vsum01a + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1() 256 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1() local 259 const float vsum0167a = vsum01a + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__scalar_c1()
|
D | 9p8x-minmax-wasm-c1.c | 97 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1() local 100 const float vsum01678 = vsum018 + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1() 166 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1() local 169 const float vsum0167a = vsum01a + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1() 256 const float vsum67 = vi6 + vi7; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1() local 259 const float vsum0167a = vsum01a + vsum67; in xnn_f32_avgpool_minmax_ukernel_9p8x__wasm_c1()
|
D | 9x-minmax-wasmsimd-arm-c4.c | 130 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_arm_c4() local 133 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_arm_c4() 159 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_arm_c4() local 162 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_arm_c4()
|
D | 9x-minmax-wasmsimd-x86-c4.c | 130 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_x86_c4() local 133 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_x86_c4() 159 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_x86_c4() local 162 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__wasmsimd_x86_c4()
|
D | 9x-minmax-sse-c4.c | 130 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__sse_c4() local 133 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__sse_c4() 158 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__sse_c4() local 161 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__sse_c4()
|
D | 9x-minmax-neon-c4.c | 121 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__neon_c4() local 124 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__neon_c4() 149 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_avgpool_minmax_ukernel_9x__neon_c4() local 152 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_avgpool_minmax_ukernel_9x__neon_c4()
|
/external/XNNPACK/src/f32-pavgpool/ |
D | 9p8x-minmax-sse-c4.c | 106 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 109 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() 182 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 185 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() 284 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 287 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() 313 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 316 const __m128 vsum0167a = _mm_add_ps(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4()
|
D | 9p8x-minmax-neon-c4.c | 97 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 100 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() 165 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 168 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() 257 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 260 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() 285 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 288 const float32x4_t vsum0167a = vaddq_f32(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4()
|
D | 9p8x-minmax-wasmsimd-arm-c4.c | 106 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 109 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 183 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 186 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 286 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 289 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() 315 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 318 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4()
|
D | 9p8x-minmax-wasmsimd-x86-c4.c | 106 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 109 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 183 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 186 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 286 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 289 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() 315 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 318 const v128_t vsum0167a = wasm_f32x4_add(vsum01a, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4()
|
D | 9p8x-minmax-scalar-c1.c | 97 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local 100 const float vsum01678 = vsum018 + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() 166 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local 169 const float vsum0167a = vsum01a + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() 258 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local 261 const float vsum0167a = vsum01a + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1()
|
D | 9p8x-minmax-wasm-c1.c | 97 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local 100 const float vsum01678 = vsum018 + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() 166 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local 169 const float vsum0167a = vsum01a + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() 258 const float vsum67 = vi6 + vi7; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local 261 const float vsum0167a = vsum01a + vsum67; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1()
|
D | 9x-minmax-sse-c4.c | 133 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__sse_c4() local 136 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__sse_c4() 161 const __m128 vsum67 = _mm_add_ps(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__sse_c4() local 164 const __m128 vsum01678 = _mm_add_ps(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__sse_c4()
|
D | 9x-minmax-wasmsimd-x86-c4.c | 133 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_x86_c4() local 136 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_x86_c4() 162 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_x86_c4() local 165 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_x86_c4()
|
D | 9x-minmax-neon-c4.c | 123 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__neon_c4() local 126 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__neon_c4() 151 const float32x4_t vsum67 = vaddq_f32(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__neon_c4() local 154 const float32x4_t vsum01678 = vaddq_f32(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__neon_c4()
|
D | 9x-minmax-wasmsimd-arm-c4.c | 133 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_arm_c4() local 136 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_arm_c4() 162 const v128_t vsum67 = wasm_f32x4_add(vi6, vi7); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_arm_c4() local 165 const v128_t vsum01678 = wasm_f32x4_add(vsum018, vsum67); in xnn_f32_pavgpool_minmax_ukernel_9x__wasmsimd_arm_c4()
|
/external/XNNPACK/src/f16-pavgpool/ |
D | 9p8x-minmax-neonfp16arith-c8.c | 97 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 100 const float16x8_t vsum01678 = vaddq_f16(vsum018, vsum67); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 165 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 168 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 257 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 260 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 285 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 288 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8()
|
D | 9p8x-minmax-avx2-c8.c | 108 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 111 …const __m256 vsum01678 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum018, vsum67), _MM_FROUN… in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() 185 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 188 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() 288 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 291 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() 317 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 320 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8()
|
/external/XNNPACK/src/f16-avgpool/ |
D | 9p8x-minmax-neonfp16arith-c8.c | 97 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 100 const float16x8_t vsum01678 = vaddq_f16(vsum018, vsum67); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 165 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 168 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 256 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 259 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() 284 const float16x8_t vsum67 = vaddq_f16(vi6, vi7); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 287 const float16x8_t vsum0167a = vaddq_f16(vsum01a, vsum67); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8()
|
D | 9p8x-minmax-f16c-c8.c | 108 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 111 …const __m256 vsum01678 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum018, vsum67), _MM_FROUN… in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() 185 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 188 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() 286 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 289 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() 315 …const __m256 vsum67 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi6, vi7), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 318 …const __m256 vsum0167a = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vsum01a, vsum67), _MM_FROUN… in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8()
|
/external/XNNPACK/src/qu8-avgpool/ |
D | 9p8x-minmax-scalar-c1.c | 104 const uint32_t vsum67 = vi6 + vi7; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1() local 107 const uint32_t vsum01678 = vsum018 + vsum67; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1() 175 const uint32_t vsum67 = vi6 + vi7; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1() local 177 const uint32_t vsum4567 = vsum45 + vsum67; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1() 267 const uint32_t vsum67 = vi6 + vi7; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1() local 269 const uint32_t vsum4567 = vsum45 + vsum67; in xnn_qu8_avgpool_minmax_ukernel_9p8x__scalar_c1()
|