Home
last modified time | relevance | path

Searched refs:vy_lo (Results 1 – 25 of 181) sorted by relevance

12345678

/external/XNNPACK/src/f32-vsqrt/gen/
Davx-sqrt-x8.c45 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8() local
47 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8()
48 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8()
52 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8()
53 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8()
57 _mm_store_ss(y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x8()
Davx-sqrt-x16.c57 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16() local
59 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16()
60 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16()
64 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16()
65 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16()
69 _mm_store_ss(y, vy_lo); in xnn_f32_vsqrt_ukernel__avx_sqrt_x16()
/external/XNNPACK/src/f32-vrnd/gen/
Dvrndu-avx-x8.c48 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndu_ukernel__avx_x8() local
50 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x8()
51 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndu_ukernel__avx_x8()
55 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x8()
56 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndu_ukernel__avx_x8()
60 _mm_store_ss(y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x8()
Dvrndne-avx-x8.c48 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndne_ukernel__avx_x8() local
50 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x8()
51 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndne_ukernel__avx_x8()
55 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x8()
56 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndne_ukernel__avx_x8()
60 _mm_store_ss(y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x8()
Dvrndd-avx-x8.c48 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndd_ukernel__avx_x8() local
50 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x8()
51 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndd_ukernel__avx_x8()
55 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x8()
56 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndd_ukernel__avx_x8()
60 _mm_store_ss(y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x8()
Dvrndz-avx-x8.c48 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndz_ukernel__avx_x8() local
50 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x8()
51 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndz_ukernel__avx_x8()
55 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x8()
56 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndz_ukernel__avx_x8()
60 _mm_store_ss(y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x8()
Dvrndz-avx-x16.c60 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndz_ukernel__avx_x16() local
62 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x16()
63 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndz_ukernel__avx_x16()
67 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x16()
68 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndz_ukernel__avx_x16()
72 _mm_store_ss(y, vy_lo); in xnn_f32_vrndz_ukernel__avx_x16()
Dvrndd-avx-x16.c60 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndd_ukernel__avx_x16() local
62 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x16()
63 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndd_ukernel__avx_x16()
67 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x16()
68 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndd_ukernel__avx_x16()
72 _mm_store_ss(y, vy_lo); in xnn_f32_vrndd_ukernel__avx_x16()
Dvrndne-avx-x16.c60 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndne_ukernel__avx_x16() local
62 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x16()
63 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndne_ukernel__avx_x16()
67 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x16()
68 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndne_ukernel__avx_x16()
72 _mm_store_ss(y, vy_lo); in xnn_f32_vrndne_ukernel__avx_x16()
Dvrndu-avx-x16.c60 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vrndu_ukernel__avx_x16() local
62 _mm_storeu_ps(y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x16()
63 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vrndu_ukernel__avx_x16()
67 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x16()
68 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vrndu_ukernel__avx_x16()
72 _mm_store_ss(y, vy_lo); in xnn_f32_vrndu_ukernel__avx_x16()
/external/XNNPACK/src/f32-vunary/gen/
Dvsqr-avx-x8.c49 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqr_ukernel__avx_x8() local
51 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x8()
52 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqr_ukernel__avx_x8()
56 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x8()
57 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqr_ukernel__avx_x8()
61 _mm_store_ss(y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x8()
Dvabs-avx-x8.c50 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vabs_ukernel__avx_x8() local
52 _mm_storeu_ps(y, vy_lo); in xnn_f32_vabs_ukernel__avx_x8()
53 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vabs_ukernel__avx_x8()
57 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vabs_ukernel__avx_x8()
58 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vabs_ukernel__avx_x8()
62 _mm_store_ss(y, vy_lo); in xnn_f32_vabs_ukernel__avx_x8()
Dvneg-avx-x8.c50 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vneg_ukernel__avx_x8() local
52 _mm_storeu_ps(y, vy_lo); in xnn_f32_vneg_ukernel__avx_x8()
53 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vneg_ukernel__avx_x8()
57 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vneg_ukernel__avx_x8()
58 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vneg_ukernel__avx_x8()
62 _mm_store_ss(y, vy_lo); in xnn_f32_vneg_ukernel__avx_x8()
Dvsqr-avx-x16.c59 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqr_ukernel__avx_x16() local
61 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x16()
62 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqr_ukernel__avx_x16()
66 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x16()
67 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqr_ukernel__avx_x16()
71 _mm_store_ss(y, vy_lo); in xnn_f32_vsqr_ukernel__avx_x16()
Dvabs-avx-x16.c60 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vabs_ukernel__avx_x16() local
62 _mm_storeu_ps(y, vy_lo); in xnn_f32_vabs_ukernel__avx_x16()
63 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vabs_ukernel__avx_x16()
67 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vabs_ukernel__avx_x16()
68 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vabs_ukernel__avx_x16()
72 _mm_store_ss(y, vy_lo); in xnn_f32_vabs_ukernel__avx_x16()
/external/XNNPACK/src/f32-vbinary/gen/
Dvminc-avx-x8.c56 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vminc_ukernel__avx_x8() local
58 _mm_storeu_ps(y, vy_lo); in xnn_f32_vminc_ukernel__avx_x8()
59 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vminc_ukernel__avx_x8()
63 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vminc_ukernel__avx_x8()
64 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vminc_ukernel__avx_x8()
68 _mm_store_ss(y, vy_lo); in xnn_f32_vminc_ukernel__avx_x8()
Dvmaxc-avx-x8.c56 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vmaxc_ukernel__avx_x8() local
58 _mm_storeu_ps(y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x8()
59 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vmaxc_ukernel__avx_x8()
63 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x8()
64 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x8()
68 _mm_store_ss(y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x8()
Dvmin-avx-x8.c59 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vmin_ukernel__avx_x8() local
61 _mm_storeu_ps(y, vy_lo); in xnn_f32_vmin_ukernel__avx_x8()
62 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vmin_ukernel__avx_x8()
66 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vmin_ukernel__avx_x8()
67 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vmin_ukernel__avx_x8()
71 _mm_store_ss(y, vy_lo); in xnn_f32_vmin_ukernel__avx_x8()
Dvmax-avx-x8.c59 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vmax_ukernel__avx_x8() local
61 _mm_storeu_ps(y, vy_lo); in xnn_f32_vmax_ukernel__avx_x8()
62 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vmax_ukernel__avx_x8()
66 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vmax_ukernel__avx_x8()
67 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vmax_ukernel__avx_x8()
71 _mm_store_ss(y, vy_lo); in xnn_f32_vmax_ukernel__avx_x8()
Dvsqrdiffc-avx-x8.c58 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqrdiffc_ukernel__avx_x8() local
60 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqrdiffc_ukernel__avx_x8()
61 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqrdiffc_ukernel__avx_x8()
65 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqrdiffc_ukernel__avx_x8()
66 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqrdiffc_ukernel__avx_x8()
70 _mm_store_ss(y, vy_lo); in xnn_f32_vsqrdiffc_ukernel__avx_x8()
Dvsqrdiff-avx-x8.c61 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsqrdiff_ukernel__avx_x8() local
63 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsqrdiff_ukernel__avx_x8()
64 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsqrdiff_ukernel__avx_x8()
68 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsqrdiff_ukernel__avx_x8()
69 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsqrdiff_ukernel__avx_x8()
73 _mm_store_ss(y, vy_lo); in xnn_f32_vsqrdiff_ukernel__avx_x8()
Dvsubc-minmax-avx-x8.c63 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vsubc_minmax_ukernel__avx_x8() local
65 _mm_storeu_ps(y, vy_lo); in xnn_f32_vsubc_minmax_ukernel__avx_x8()
66 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vsubc_minmax_ukernel__avx_x8()
70 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vsubc_minmax_ukernel__avx_x8()
71 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vsubc_minmax_ukernel__avx_x8()
75 _mm_store_ss(y, vy_lo); in xnn_f32_vsubc_minmax_ukernel__avx_x8()
Dvmaxc-avx-x16.c67 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vmaxc_ukernel__avx_x16() local
69 _mm_storeu_ps(y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x16()
70 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vmaxc_ukernel__avx_x16()
74 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x16()
75 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x16()
79 _mm_store_ss(y, vy_lo); in xnn_f32_vmaxc_ukernel__avx_x16()
Dvdivc-minmax-avx-x8.c63 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vdivc_minmax_ukernel__avx_x8() local
65 _mm_storeu_ps(y, vy_lo); in xnn_f32_vdivc_minmax_ukernel__avx_x8()
66 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vdivc_minmax_ukernel__avx_x8()
70 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vdivc_minmax_ukernel__avx_x8()
71 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vdivc_minmax_ukernel__avx_x8()
75 _mm_store_ss(y, vy_lo); in xnn_f32_vdivc_minmax_ukernel__avx_x8()
Dvminc-avx-x16.c67 __m128 vy_lo = _mm256_castps256_ps128(vy); in xnn_f32_vminc_ukernel__avx_x16() local
69 _mm_storeu_ps(y, vy_lo); in xnn_f32_vminc_ukernel__avx_x16()
70 vy_lo = _mm256_extractf128_ps(vy, 1); in xnn_f32_vminc_ukernel__avx_x16()
74 _mm_storel_pi((__m64*) y, vy_lo); in xnn_f32_vminc_ukernel__avx_x16()
75 vy_lo = _mm_movehl_ps(vy_lo, vy_lo); in xnn_f32_vminc_ukernel__avx_x16()
79 _mm_store_ss(y, vy_lo); in xnn_f32_vminc_ukernel__avx_x16()

12345678