/external/libvpx/libvpx/vpx_dsp/x86/ |
D | convolve_avx2.h | 80 const __m128i x0 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[0]), in convolve8_8_avx2() 81 _mm256_castsi256_si128(f[0])); in convolve8_8_avx2() 82 const __m128i x1 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[1]), in convolve8_8_avx2() 83 _mm256_castsi256_si128(f[1])); in convolve8_8_avx2() 84 const __m128i x2 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[2]), in convolve8_8_avx2() 85 _mm256_castsi256_si128(f[2])); in convolve8_8_avx2() 86 const __m128i x3 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[3]), in convolve8_8_avx2() 87 _mm256_castsi256_si128(f[3])); in convolve8_8_avx2()
|
D | vpx_subpixel_8t_intrin_avx2.c | 99 outReg1 = _mm256_castsi256_si128(outReg32b1); in vpx_filter_block1d16_h8_x_avx2() 126 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[0]))); in vpx_filter_block1d16_h8_x_avx2() 128 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[1]))); in vpx_filter_block1d16_h8_x_avx2() 130 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[2]))); in vpx_filter_block1d16_h8_x_avx2() 132 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[3]))); in vpx_filter_block1d16_h8_x_avx2() 141 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[0]))); in vpx_filter_block1d16_h8_x_avx2() 143 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[1]))); in vpx_filter_block1d16_h8_x_avx2() 145 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[2]))); in vpx_filter_block1d16_h8_x_avx2() 147 _mm_shuffle_epi8(srcReg, _mm256_castsi256_si128(filt[3]))); in vpx_filter_block1d16_h8_x_avx2() 215 _mm256_castsi256_si128(srcRegHead1), 1); in vpx_filter_block1d16_v8_x_avx2() [all …]
|
D | loopfilter_avx2.c | 410 p4 = _mm256_castsi256_si128(p256_4); in vpx_lpf_horizontal_16_dual_avx2() 411 p3 = _mm256_castsi256_si128(p256_3); in vpx_lpf_horizontal_16_dual_avx2() 412 p2 = _mm256_castsi256_si128(p256_2); in vpx_lpf_horizontal_16_dual_avx2() 413 p1 = _mm256_castsi256_si128(p256_1); in vpx_lpf_horizontal_16_dual_avx2() 414 p0 = _mm256_castsi256_si128(p256_0); in vpx_lpf_horizontal_16_dual_avx2() 415 q0 = _mm256_castsi256_si128(q256_0); in vpx_lpf_horizontal_16_dual_avx2() 416 q1 = _mm256_castsi256_si128(q256_1); in vpx_lpf_horizontal_16_dual_avx2() 417 q2 = _mm256_castsi256_si128(q256_2); in vpx_lpf_horizontal_16_dual_avx2() 418 q3 = _mm256_castsi256_si128(q256_3); in vpx_lpf_horizontal_16_dual_avx2() 419 q4 = _mm256_castsi256_si128(q256_4); in vpx_lpf_horizontal_16_dual_avx2() [all …]
|
D | sad_avx2.c | 37 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \ 69 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \ 120 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \ 158 sum_sad128 = _mm_add_epi32(_mm256_castsi256_si128(sum_sad), sum_sad128); \
|
D | highbd_convolve_avx2.c | 315 const __m128i a0 = _mm256_castsi256_si128(*y); in store_8x1_pixels() 318 res = _mm_min_epi16(res, _mm256_castsi256_si128(*mask)); in store_8x1_pixels() 327 _mm_storeu_si128((__m128i *)dst, _mm256_castsi256_si128(a)); in store_8x2_pixels() 522 s0 = _mm256_inserti128_si256(s0, _mm256_castsi256_si128(s1), 1); in pack_8x9_init() 523 s1 = _mm256_inserti128_si256(s1, _mm256_castsi256_si128(s2), 1); in pack_8x9_init() 524 s2 = _mm256_inserti128_si256(s2, _mm256_castsi256_si128(s3), 1); in pack_8x9_init() 525 s3 = _mm256_inserti128_si256(s3, _mm256_castsi256_si128(s4), 1); in pack_8x9_init() 526 s4 = _mm256_inserti128_si256(s4, _mm256_castsi256_si128(s5), 1); in pack_8x9_init() 527 s5 = _mm256_inserti128_si256(s5, _mm256_castsi256_si128(s6), 1); in pack_8x9_init() 546 __m256i s2 = _mm256_inserti128_si256(sig[8], _mm256_castsi256_si128(s0), 1); in pack_8x9_pixels() [all …]
|
D | sad4d_avx2.c | 75 sum = _mm_add_epi32(_mm256_castsi256_si128(sum_mlow), in vpx_sad32x32x4d_avx2() 159 sum = _mm_add_epi32(_mm256_castsi256_si128(sum_mlow), in vpx_sad64x64x4d_avx2()
|
D | variance_avx2.c | 75 _mm256_castsi256_si128(sum_reg), _mm256_extractf128_si256(sum_reg, 1)); in vpx_get16x16var_avx2() 77 _mm256_castsi256_si128(sse_reg), _mm256_extractf128_si256(sse_reg, 1)); in vpx_get16x16var_avx2() 144 _mm256_castsi256_si128(sum_reg), _mm256_extractf128_si256(sum_reg, 1)); in get32x16var_avx2() 146 _mm256_castsi256_si128(sse_reg), _mm256_extractf128_si256(sse_reg, 1)); in get32x16var_avx2() 208 *((int *)sse) = _mm_cvtsi128_si32(_mm256_castsi256_si128(sse_reg)) + \ 212 sum = _mm_cvtsi128_si32(_mm256_castsi256_si128(sum_reg)) + \
|
D | sad4d_avx512.c | 78 sum128 = _mm_add_epi32(_mm256_castsi256_si128(sum256), in vpx_sad64x64x4d_avx512()
|
D | avg_intrin_avx2.c | 193 const __m128i accum_128 = _mm_add_epi32(_mm256_castsi256_si128(d), in vpx_satd_avx2()
|
D | fwd_dct32x32_impl_avx2.h | 2963 _mm256_castsi256_si128(tr2_0)); in FDCT32x32_2D_AVX2() 2965 _mm256_castsi256_si128(tr2_1)); in FDCT32x32_2D_AVX2() 2967 _mm256_castsi256_si128(tr2_2)); in FDCT32x32_2D_AVX2() 2969 _mm256_castsi256_si128(tr2_3)); in FDCT32x32_2D_AVX2() 2971 _mm256_castsi256_si128(tr2_4)); in FDCT32x32_2D_AVX2() 2973 _mm256_castsi256_si128(tr2_5)); in FDCT32x32_2D_AVX2() 2975 _mm256_castsi256_si128(tr2_6)); in FDCT32x32_2D_AVX2() 2977 _mm256_castsi256_si128(tr2_7)); in FDCT32x32_2D_AVX2()
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_error_avx2.c | 96 sse_128 = _mm_add_epi64(_mm256_castsi256_si128(sse_256), in vp9_block_error_avx2() 99 ssz_128 = _mm_add_epi64(_mm256_castsi256_si128(ssz_256), in vp9_block_error_avx2() 155 sse_128 = _mm_add_epi64(_mm256_castsi256_si128(sse_256), in vp9_block_error_fp_avx2()
|
/external/flac/libFLAC/ |
D | stream_encoder_intrin_avx2.c | 74 sum128 = _mm_add_epi32(_mm256_extracti128_si256(sum256, 1), _mm256_castsi256_si128(sum256)); in FLAC__precompute_partition_info_sums_intrin_avx2() 107 sum128 = _mm_add_epi64(_mm256_extracti128_si256(sum256, 1), _mm256_castsi256_si128(sum256)); in FLAC__precompute_partition_info_sums_intrin_avx2()
|
D | lpc_intrin_avx2.c | 807 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 838 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 869 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 896 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 925 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 948 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 971 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 990 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 1011 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() 1026 …sidual+i), _mm_sub_epi32(_mm_loadu_si128((const __m128i*)(data+i)), _mm256_castsi256_si128(summ))); in FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2() [all …]
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/ |
D | simdintrin.h | 106 __m128i aLo = _mm256_castsi256_si128(a);\ 107 __m128i bLo = _mm256_castsi256_si128(b);\ 125 __m128i bLo = _mm256_castsi256_si128(b); in _simdemu_permute_ps() 405 __m128i aLo = _mm256_castsi256_si128(a); in _simd_abs_epi32() 417 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_movemask_epi8() 635 _mm_storeu_si128(loaddr, _mm256_castsi256_si128(a)); in _simd_storeu2_si() 675 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_slli_epi32() 689 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_srai_epi32() 703 __m128i aLo = _mm256_castsi256_si128(a); in _simdemu_srli_epi32()
|
D | os.h | 161 _mm_storeu_si128((__m128i*)lo, _mm256_castsi256_si128(a)); in _mm256_storeu2_m128i()
|
/external/libhevc/common/x86/ |
D | ihevc_platform_macros.h | 157 #define _mm256_storeu2_m128i(X,Y,Z) {_mm_storeu_si128 ((Y), _mm256_castsi256_si128((Z)));_mm_storeu…
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/ |
D | format_types.h | 124 … __m128i res16 = _mm_packus_epi32(_mm256_castsi256_si128(src), _mm256_extractf128_si256(src, 1)); 239 … __m128i res16 = _mm_packs_epi32(_mm256_castsi256_si128(src), _mm256_extractf128_si256(src, 1)); 353 …__m256i res = _mm256_castsi128_si256(_mm_packus_epi32(_mm256_castsi256_si128(src), _mm256_extractf… 452 …__m256i res = _mm256_castsi128_si256(_mm_packs_epi32(_mm256_castsi256_si128(src), _mm256_extractf1… 1014 …vDst = _mm256_castsi128_si256(_mm_packus_epi32(_mm256_castsi256_si128(vDst), _mm256_extractf128_si…
|
D | utils.h | 295 …__m128i c0c1 = _mm256_castsi256_si128(src); // rrrrrrrrg… in Transpose() 373 __m128i rg = _mm256_castsi256_si128(src); // rrrrrrrr gggggggg in Transpose()
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/memory/ |
D | StoreTile.h | 739 __m128i srcLo0 = _mm256_castsi256_si128(src0); // 000r000r000r000r 740 __m128i srcLo1 = _mm256_castsi256_si128(src1); // 000g000g000g000g 741 __m128i srcLo2 = _mm256_castsi256_si128(src2); // 000b000b000b000b 742 __m128i srcLo3 = _mm256_castsi256_si128(src3); // 000a000a000a000a 904 __m128i srcLo0 = _mm256_castsi256_si128(src0); // 000r000r000r000r 905 __m128i srcLo1 = _mm256_castsi256_si128(src1); // 000g000g000g000g 906 __m128i srcLo2 = _mm256_castsi256_si128(src2); // 000b000b000b000b
|
/external/clang/lib/Headers/ |
D | avxintrin.h | 2753 _mm256_castsi256_si128(__m256i __a) in _mm256_castsi256_si128() function 2890 __v128 = _mm256_castsi256_si128(__a); in _mm256_storeu2_m128i()
|
/external/clang/test/CodeGen/ |
D | avx-builtins.c | 200 return _mm256_castsi256_si128(A); in test_mm256_castsi256_si128()
|
/external/eigen/Eigen/src/Core/arch/AVX/ |
D | PacketMath.h | 323 return _mm_cvtsi128_si32(_mm256_castsi256_si128(a));
|