Home
last modified time | relevance | path

Searched defs:vk0x01234567 (Results 1 – 25 of 337) sorted by relevance

12345678910>>...14

/external/XNNPACK/src/f32-dwconv/gen/
Dup16x3-minmax-avx.c63 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx() local
104 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx() local
136 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx() local
Dup16x3-minmax-fma3.c63 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3() local
104 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3() local
136 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3() local
Dup16x3-minmax-fma3-acc2.c63 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
107 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
141 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
Dup16x3-minmax-avx-acc2.c63 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx_acc2() local
107 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx_acc2() local
141 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x3__avx_acc2() local
Dup16x4-minmax-fma3.c68 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3() local
118 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3() local
156 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3() local
Dup16x4-minmax-avx.c68 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx() local
118 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx() local
156 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx() local
Dup16x4-minmax-fma3-acc2.c68 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
121 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
161 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
Dup16x4-minmax-avx-acc2.c68 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx_acc2() local
121 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx_acc2() local
161 const __m256 vk0x01234567 = _mm256_load_ps(w + 16); in xnn_f32_dwconv_minmax_ukernel_up16x4__avx_acc2() local
Dup8x3-minmax-fma3.c61 const __m256 vk0x01234567 = _mm256_load_ps(w + 8); in xnn_f32_dwconv_minmax_ukernel_up8x3__fma3() local
93 const __m256 vk0x01234567 = _mm256_load_ps(w + 8); in xnn_f32_dwconv_minmax_ukernel_up8x3__fma3() local
Dup8x3-minmax-avx.c61 const __m256 vk0x01234567 = _mm256_load_ps(w + 8); in xnn_f32_dwconv_minmax_ukernel_up8x3__avx() local
93 const __m256 vk0x01234567 = _mm256_load_ps(w + 8); in xnn_f32_dwconv_minmax_ukernel_up8x3__avx() local
/external/XNNPACK/src/f16-dwconv/gen/
Dup16x3-minmax-fma3.c66 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3() local
107 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3() local
139 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3() local
Dup16x3-minmax-neonfp16arith.c63 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith() local
96 const float16x8_t vk0x01234567 = vld1q_f16(w + 8); in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith() local
118 const float16x8_t vk0x01234567 = vld1q_f16(w + 16); in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith() local
Dup16x3-minmax-neonfp16arith-acc2.c63 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith_acc2() local
99 const float16x8_t vk0x01234567 = vld1q_f16(w + 8); in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith_acc2() local
123 const float16x8_t vk0x01234567 = vld1q_f16(w + 16); in xnn_f16_dwconv_minmax_ukernel_up16x3__neonfp16arith_acc2() local
Dup16x3-minmax-fma3-acc2.c66 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
110 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
144 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x3__fma3_acc2() local
Dup16x4-minmax-neonfp16arith.c68 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith() local
108 const float16x8_t vk0x01234567 = vld1q_f16(w + 8); in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith() local
134 const float16x8_t vk0x01234567 = vld1q_f16(w + 16); in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith() local
Dup16x4-minmax-fma3.c71 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3() local
121 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3() local
159 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3() local
Dup16x4-minmax-neonfp16arith-acc2.c68 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith_acc2() local
111 const float16x8_t vk0x01234567 = vld1q_f16(w + 8); in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith_acc2() local
139 const float16x8_t vk0x01234567 = vld1q_f16(w + 16); in xnn_f16_dwconv_minmax_ukernel_up16x4__neonfp16arith_acc2() local
Dup16x4-minmax-fma3-acc2.c71 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
124 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
164 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 16))); in xnn_f16_dwconv_minmax_ukernel_up16x4__fma3_acc2() local
Dup32x3-minmax-fma3.c70 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3() local
133 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3() local
165 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3() local
Dup32x3-minmax-neonfp16arith.c67 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith() local
122 const float16x8_t vk0x01234567 = vld1q_f16(w + 24); in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith() local
144 const float16x8_t vk0x01234567 = vld1q_f16(w + 32); in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith() local
Dup8x3-minmax-neonfp16arith.c61 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up8x3__neonfp16arith() local
83 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up8x3__neonfp16arith() local
Dup8x3-minmax-fma3.c64 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 8))); in xnn_f16_dwconv_minmax_ukernel_up8x3__fma3() local
96 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 8))); in xnn_f16_dwconv_minmax_ukernel_up8x3__fma3() local
Dup32x3-minmax-neonfp16arith-acc2.c67 const float16x8_t vk0x01234567 = vld1q_f16(w); w += 8; in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith_acc2() local
127 const float16x8_t vk0x01234567 = vld1q_f16(w + 24); in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith_acc2() local
151 const float16x8_t vk0x01234567 = vld1q_f16(w + 32); in xnn_f16_dwconv_minmax_ukernel_up32x3__neonfp16arith_acc2() local
Dup32x3-minmax-fma3-acc2.c70 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3_acc2() local
138 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3_acc2() local
172 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 32))); in xnn_f16_dwconv_minmax_ukernel_up32x3__fma3_acc2() local
Dup8x3-minmax-fma3-acc2.c64 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_loadu_si128((const __m128i*) (w + 8))); in xnn_f16_dwconv_minmax_ukernel_up8x3__fma3_acc2() local
98 const __m256 vk0x01234567 = _mm256_cvtph_ps(_mm_load_si128((const __m128i*) (w + 8))); in xnn_f16_dwconv_minmax_ukernel_up8x3__fma3_acc2() local

12345678910>>...14