Home
last modified time | relevance | path

Searched refs:_mm_store_ss (Results 1 – 25 of 351) sorted by relevance

12345678910>>...15

/external/XNNPACK/src/f32-igemm/gen/
D8x8-fma3-broadcast.c269 _mm_store_ss(c7, vacc7x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
270 _mm_store_ss(c6, vacc6x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
271 _mm_store_ss(c5, vacc5x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
272 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
273 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
274 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
275 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
276 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_8x8__fma3_broadcast()
D7x8-fma3-broadcast.c245 _mm_store_ss(c6, vacc6x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
246 _mm_store_ss(c5, vacc5x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
247 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
248 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
249 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
250 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
251 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_7x8__fma3_broadcast()
D7x8-avx-broadcast.c245 _mm_store_ss(c6, vacc6x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
246 _mm_store_ss(c5, vacc5x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
247 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
248 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
249 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
250 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
251 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_7x8__avx_broadcast()
D6x8-fma3-broadcast.c221 _mm_store_ss(c5, vacc5x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
222 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
223 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
224 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
225 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
226 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_6x8__fma3_broadcast()
D6x8-avx-broadcast.c221 _mm_store_ss(c5, vacc5x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
222 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
223 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
224 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
225 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
226 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_6x8__avx_broadcast()
D5x8-fma3-broadcast.c197 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_5x8__fma3_broadcast()
198 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_5x8__fma3_broadcast()
199 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_5x8__fma3_broadcast()
200 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_5x8__fma3_broadcast()
201 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_5x8__fma3_broadcast()
D5x8-avx-broadcast.c197 _mm_store_ss(c4, vacc4x0123); in xnn_f32_igemm_ukernel_5x8__avx_broadcast()
198 _mm_store_ss(c3, vacc3x0123); in xnn_f32_igemm_ukernel_5x8__avx_broadcast()
199 _mm_store_ss(c2, vacc2x0123); in xnn_f32_igemm_ukernel_5x8__avx_broadcast()
200 _mm_store_ss(c1, vacc1x0123); in xnn_f32_igemm_ukernel_5x8__avx_broadcast()
201 _mm_store_ss(c0, vacc0x0123); in xnn_f32_igemm_ukernel_5x8__avx_broadcast()
/external/XNNPACK/src/f32-gemm/gen-inc/
D8x8-fma3-broadcast.c244 _mm_store_ss(c7, vacc7x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
245 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
246 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
247 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
248 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
249 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
250 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
251 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_8x8__fma3_broadcast()
D7x8-avx-broadcast.c222 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
223 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
224 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
225 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
226 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
227 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
228 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_7x8__avx_broadcast()
D7x8-fma3-broadcast.c222 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
223 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
224 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
225 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
226 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
227 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
228 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_7x8__fma3_broadcast()
D6x8-fma3-broadcast.c200 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
201 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
202 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
203 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
204 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
205 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_6x8__fma3_broadcast()
D6x8-avx-broadcast.c200 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
201 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
202 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
203 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
204 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
205 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_6x8__avx_broadcast()
D5x8-avx-broadcast.c178 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_5x8__avx_broadcast()
179 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_5x8__avx_broadcast()
180 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_5x8__avx_broadcast()
181 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_5x8__avx_broadcast()
182 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_5x8__avx_broadcast()
D5x8-fma3-broadcast.c178 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemminc_ukernel_5x8__fma3_broadcast()
179 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_5x8__fma3_broadcast()
180 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_5x8__fma3_broadcast()
181 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_5x8__fma3_broadcast()
182 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_5x8__fma3_broadcast()
D4x8-fma3-broadcast.c156 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemminc_ukernel_4x8__fma3_broadcast()
157 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemminc_ukernel_4x8__fma3_broadcast()
158 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemminc_ukernel_4x8__fma3_broadcast()
159 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemminc_ukernel_4x8__fma3_broadcast()
/external/XNNPACK/src/f32-gemm/gen/
D8x8-fma3-broadcast.c242 _mm_store_ss(c7, vacc7x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
243 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
244 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
245 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
246 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
247 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
248 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
249 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_8x8__fma3_broadcast()
D7x8-fma3-broadcast.c220 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
221 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
222 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
223 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
224 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
225 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
226 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_7x8__fma3_broadcast()
D7x8-avx-broadcast.c220 _mm_store_ss(c6, vacc6x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
221 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
222 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
223 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
224 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
225 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
226 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_7x8__avx_broadcast()
D6x8-avx-broadcast.c198 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
199 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
200 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
201 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
202 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
203 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_6x8__avx_broadcast()
D6x8-fma3-broadcast.c198 _mm_store_ss(c5, vacc5x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
199 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
200 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
201 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
202 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
203 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_6x8__fma3_broadcast()
D5x8-fma3-broadcast.c176 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_5x8__fma3_broadcast()
177 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_5x8__fma3_broadcast()
178 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_5x8__fma3_broadcast()
179 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_5x8__fma3_broadcast()
180 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_5x8__fma3_broadcast()
D5x8-avx-broadcast.c176 _mm_store_ss(c4, vacc4x0123); in xnn_f32_gemm_ukernel_5x8__avx_broadcast()
177 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_5x8__avx_broadcast()
178 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_5x8__avx_broadcast()
179 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_5x8__avx_broadcast()
180 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_5x8__avx_broadcast()
D4x8-fma3-broadcast.c154 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_4x8__fma3_broadcast()
155 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_4x8__fma3_broadcast()
156 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_4x8__fma3_broadcast()
157 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_4x8__fma3_broadcast()
D4x8-avx-broadcast.c154 _mm_store_ss(c3, vacc3x0123); in xnn_f32_gemm_ukernel_4x8__avx_broadcast()
155 _mm_store_ss(c2, vacc2x0123); in xnn_f32_gemm_ukernel_4x8__avx_broadcast()
156 _mm_store_ss(c1, vacc1x0123); in xnn_f32_gemm_ukernel_4x8__avx_broadcast()
157 _mm_store_ss(c0, vacc0x0123); in xnn_f32_gemm_ukernel_4x8__avx_broadcast()
/external/XNNPACK/src/x32-zip/
Dx3-sse2.c84 _mm_store_ss(o, vx); in xnn_x32_zip_x3_ukernel__sse2()
85 _mm_store_ss(o + 1, vy); in xnn_x32_zip_x3_ukernel__sse2()
86 _mm_store_ss(o + 2, vz); in xnn_x32_zip_x3_ukernel__sse2()

12345678910>>...15