Home
last modified time | relevance | path

Searched refs:_mm256_castsi256_si128 (Results 1 – 22 of 22) sorted by relevance

/external/libvpx/libvpx/vpx_dsp/x86/
Dconvolve_avx2.h80 const __m128i x0 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[0]), in convolve8_8_avx2()
81 _mm256_castsi256_si128(f[0])); in convolve8_8_avx2()
82 const __m128i x1 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[1]), in convolve8_8_avx2()
83 _mm256_castsi256_si128(f[1])); in convolve8_8_avx2()
84 const __m128i x2 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[2]), in convolve8_8_avx2()
85 _mm256_castsi256_si128(f[2])); in convolve8_8_avx2()
86 const __m128i x3 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[3]), in convolve8_8_avx2()
87 _mm256_castsi256_si128(f[3])); in convolve8_8_avx2()
Dvpx_subpixel_8t_intrin_avx2.c99 outReg1 = _mm256_castsi256_si128(outReg32b1); in vpx_filter_block1d16_h8_x_avx2()
126 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[0]))); in vpx_filter_block1d16_h8_x_avx2()
128 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[1]))); in vpx_filter_block1d16_h8_x_avx2()
130 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[2]))); in vpx_filter_block1d16_h8_x_avx2()
132 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[3]))); in vpx_filter_block1d16_h8_x_avx2()
141 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[0]))); in vpx_filter_block1d16_h8_x_avx2()
143 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[1]))); in vpx_filter_block1d16_h8_x_avx2()
145 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[2]))); in vpx_filter_block1d16_h8_x_avx2()
147 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[3]))); in vpx_filter_block1d16_h8_x_avx2()
215 _mm256_castsi256_si128(srcRegHead1), 1); in vpx_filter_block1d16_v8_x_avx2()
[all …]
Dloopfilter_avx2.c410 p4 = _mm256_castsi256_si128(p256_4); in vpx_lpf_horizontal_16_dual_avx2()
411 p3 = _mm256_castsi256_si128(p256_3); in vpx_lpf_horizontal_16_dual_avx2()
412 p2 = _mm256_castsi256_si128(p256_2); in vpx_lpf_horizontal_16_dual_avx2()
413 p1 = _mm256_castsi256_si128(p256_1); in vpx_lpf_horizontal_16_dual_avx2()
414 p0 = _mm256_castsi256_si128(p256_0); in vpx_lpf_horizontal_16_dual_avx2()
415 q0 = _mm256_castsi256_si128(q256_0); in vpx_lpf_horizontal_16_dual_avx2()
416 q1 = _mm256_castsi256_si128(q256_1); in vpx_lpf_horizontal_16_dual_avx2()
417 q2 = _mm256_castsi256_si128(q256_2); in vpx_lpf_horizontal_16_dual_avx2()
418 q3 = _mm256_castsi256_si128(q256_3); in vpx_lpf_horizontal_16_dual_avx2()
419 q4 = _mm256_castsi256_si128(q256_4); in vpx_lpf_horizontal_16_dual_avx2()
[all …]
Dsad_avx2.c37 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \
69 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \
120 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \
158 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \
Dhighbd_convolve_avx2.c315 const __m128i a0 = _mm256_castsi256_si128(*y); in store_8x1_pixels()
318 res = _mm_min_epi16(res, _mm256_castsi256_si128(*mask)); in store_8x1_pixels()
327 _mm_storeu_si128((__m128i *)dst, _mm256_castsi256_si128(a)); in store_8x2_pixels()
522 s0 = _mm256_inserti128_si256(s0, _mm256_castsi256_si128(s1), 1); in pack_8x9_init()
523 s1 = _mm256_inserti128_si256(s1, _mm256_castsi256_si128(s2), 1); in pack_8x9_init()
524 s2 = _mm256_inserti128_si256(s2, _mm256_castsi256_si128(s3), 1); in pack_8x9_init()
525 s3 = _mm256_inserti128_si256(s3, _mm256_castsi256_si128(s4), 1); in pack_8x9_init()
526 s4 = _mm256_inserti128_si256(s4, _mm256_castsi256_si128(s5), 1); in pack_8x9_init()
527 s5 = _mm256_inserti128_si256(s5, _mm256_castsi256_si128(s6), 1); in pack_8x9_init()
546 __m256i s2 = _mm256_inserti128_si256(sig[8], _mm256_castsi256_si128(s0), 1); in pack_8x9_pixels()
[all …]
Dsad4d_avx2.c75 sum = _mm_add_epi32(_mm256_castsi256_si128(sum_mlow), in vpx_sad32x32x4d_avx2()
159 sum = _mm_add_epi32(_mm256_castsi256_si128(sum_mlow), in vpx_sad64x64x4d_avx2()
Dvariance_avx2.c75 _mm256_castsi256_si128(sum_reg), _mm256_extractf128_si256(sum_reg, 1)); in vpx_get16x16var_avx2()
77 _mm256_castsi256_si128(sse_reg), _mm256_extractf128_si256(sse_reg, 1)); in vpx_get16x16var_avx2()
144 _mm256_castsi256_si128(sum_reg), _mm256_extractf128_si256(sum_reg, 1)); in get32x16var_avx2()
146 _mm256_castsi256_si128(sse_reg), _mm256_extractf128_si256(sse_reg, 1)); in get32x16var_avx2()
208 *((int *)sse) = _mm_cvtsi128_si32(_mm256_castsi256_si128(sse_reg)) + \
212 sum = _mm_cvtsi128_si32(_mm256_castsi256_si128(sum_reg)) + \
Dsad4d_avx512.c78 sum128 = _mm_add_epi32(_mm256_castsi256_si128(sum256), in vpx_sad64x64x4d_avx512()
Davg_intrin_avx2.c193 const __m128i accum_128 = _mm_add_epi32(_mm256_castsi256_si128(d), in vpx_satd_avx2()
Dfwd_dct32x32_impl_avx2.h2963 _mm256_castsi256_si128(tr2_0)); in FDCT32x32_2D_AVX2()
2965 _mm256_castsi256_si128(tr2_1)); in FDCT32x32_2D_AVX2()
2967 _mm256_castsi256_si128(tr2_2)); in FDCT32x32_2D_AVX2()
2969 _mm256_castsi256_si128(tr2_3)); in FDCT32x32_2D_AVX2()
2971 _mm256_castsi256_si128(tr2_4)); in FDCT32x32_2D_AVX2()
2973 _mm256_castsi256_si128(tr2_5)); in FDCT32x32_2D_AVX2()
2975 _mm256_castsi256_si128(tr2_6)); in FDCT32x32_2D_AVX2()
2977 _mm256_castsi256_si128(tr2_7)); in FDCT32x32_2D_AVX2()
/external/libvpx/libvpx/vp9/encoder/x86/
Dvp9_error_avx2.c96 sse_128 = _mm_add_epi64(_mm256_castsi256_si128(sse_256), in vp9_block_error_avx2()
99 ssz_128 = _mm_add_epi64(_mm256_castsi256_si128(ssz_256), in vp9_block_error_avx2()
155 sse_128 = _mm_add_epi64(_mm256_castsi256_si128(sse_256), in vp9_block_error_fp_avx2()
/external/flac/libFLAC/
Dstream_encoder_intrin_avx2.c74 sum128 = _mm_add_epi32(_mm256_extracti128_si256(sum256, 1), _mm256_castsi256_si128(sum256)); in FLAC__precompute_partition_info_sums_intrin_avx2()
107 sum128 = _mm_add_epi64(_mm256_extracti128_si256(sum256, 1), _mm256_castsi256_si128(sum256)); in FLAC__precompute_partition_info_sums_intrin_avx2()
Dlpc_intrin_avx2.c807 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
838 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
869 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
896 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
925 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
948 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
971 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
990 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
1011 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
1026 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2()
[all …]
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/
Dsimdintrin.h106 __m128i aLo = _mm256_castsi256_si128(a);\
107 __m128i bLo = _mm256_castsi256_si128(b);\
125 __m128i bLo = _mm256_castsi256_si128(b); in _simdemu_permute_ps()
405 __m128i aLo = _mm256_castsi256_si128(a); in _simd_abs_epi32()
417 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_movemask_epi8()
635 _mm_storeu_si128(loaddr, _mm256_castsi256_si128(a)); in _simd_storeu2_si()
675 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_slli_epi32()
689 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_srai_epi32()
703 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_srli_epi32()
Dos.h161 _mm_storeu_si128((__m128i*)lo, _mm256_castsi256_si128(a)); in _mm256_storeu2_m128i()
/external/libhevc/common/x86/
Dihevc_platform_macros.h157 #define _mm256_storeu2_m128i(X,Y,Z) {_mm_storeu_si128 ((Y), _mm256_castsi256_si128((Z)));_mm_storeu…
/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/
Dformat_types.h124 … __m128i res16 = _mm_packus_epi32(_mm256_castsi256_si128(src), _mm256_extractf128_si256(src, 1));
239 … __m128i res16 = _mm_packs_epi32(_mm256_castsi256_si128(src), _mm256_extractf128_si256(src, 1));
353 …__m256i res = _mm256_castsi128_si256(_mm_packus_epi32(_mm256_castsi256_si128(src), _mm256_extractf…
452 …__m256i res = _mm256_castsi128_si256(_mm_packs_epi32(_mm256_castsi256_si128(src), _mm256_extractf1…
1014 …vDst = _mm256_castsi128_si256(_mm_packus_epi32(_mm256_castsi256_si128(vDst), _mm256_extractf128_si…
Dutils.h295 …__m128i c0c1 = _mm256_castsi256_si128(src); // rrrrrrrrg… in Transpose()
373 __m128i rg = _mm256_castsi256_si128(src); // rrrrrrrr gggggggg in Transpose()
/external/mesa3d/src/gallium/drivers/swr/rasterizer/memory/
DStoreTile.h739 __m128i srcLo0 = _mm256_castsi256_si128(src0); // 000r000r000r000r
740 __m128i srcLo1 = _mm256_castsi256_si128(src1); // 000g000g000g000g
741 __m128i srcLo2 = _mm256_castsi256_si128(src2); // 000b000b000b000b
742 __m128i srcLo3 = _mm256_castsi256_si128(src3); // 000a000a000a000a
904 __m128i srcLo0 = _mm256_castsi256_si128(src0); // 000r000r000r000r
905 __m128i srcLo1 = _mm256_castsi256_si128(src1); // 000g000g000g000g
906 __m128i srcLo2 = _mm256_castsi256_si128(src2); // 000b000b000b000b
/external/clang/lib/Headers/
Davxintrin.h2753 _mm256_castsi256_si128(__m256i __a) in _mm256_castsi256_si128() function
2890 __v128 = _mm256_castsi256_si128(__a); in _mm256_storeu2_m128i()
/external/clang/test/CodeGen/
Davx-builtins.c200 return _mm256_castsi256_si128(A); in test_mm256_castsi256_si128()
/external/eigen/Eigen/src/Core/arch/AVX/
DPacketMath.h323 return _mm_cvtsi128_si32(_mm256_castsi256_si128(a));