/external/clang/lib/Headers/ |
D | xopintrin.h | 36 static __inline__ __m128i __DEFAULT_FN_ATTRS 37 _mm_maccs_epi16(__m128i __A, __m128i __B, __m128i __C) in _mm_maccs_epi16() 39 return (__m128i)__builtin_ia32_vpmacssww((__v8hi)__A, (__v8hi)__B, (__v8hi)__C); in _mm_maccs_epi16() 42 static __inline__ __m128i __DEFAULT_FN_ATTRS 43 _mm_macc_epi16(__m128i __A, __m128i __B, __m128i __C) in _mm_macc_epi16() 45 return (__m128i)__builtin_ia32_vpmacsww((__v8hi)__A, (__v8hi)__B, (__v8hi)__C); in _mm_macc_epi16() 48 static __inline__ __m128i __DEFAULT_FN_ATTRS 49 _mm_maccsd_epi16(__m128i __A, __m128i __B, __m128i __C) in _mm_maccsd_epi16() 51 return (__m128i)__builtin_ia32_vpmacsswd((__v8hi)__A, (__v8hi)__B, (__v4si)__C); in _mm_maccsd_epi16() 54 static __inline__ __m128i __DEFAULT_FN_ATTRS [all …]
|
D | emmintrin.h | 30 typedef long long __m128i __attribute__((__vector_size__(16))); typedef 393 _mm_cvtepi32_pd(__m128i __a) in _mm_cvtepi32_pd() 398 static __inline__ __m128i __DEFAULT_FN_ATTRS 431 static __inline__ __m128i __DEFAULT_FN_ATTRS 434 return (__m128i)__builtin_ia32_cvttpd2dq(__a); in _mm_cvttpd_epi32() 629 static __inline__ __m128i __DEFAULT_FN_ATTRS 630 _mm_add_epi8(__m128i __a, __m128i __b) in _mm_add_epi8() 632 return (__m128i)((__v16qi)__a + (__v16qi)__b); in _mm_add_epi8() 635 static __inline__ __m128i __DEFAULT_FN_ATTRS 636 _mm_add_epi16(__m128i __a, __m128i __b) in _mm_add_epi16() [all …]
|
D | smmintrin.h | 101 static __inline__ __m128i __DEFAULT_FN_ATTRS 102 _mm_blendv_epi8 (__m128i __V1, __m128i __V2, __m128i __M) in _mm_blendv_epi8() 104 return (__m128i) __builtin_ia32_pblendvb128 ((__v16qi)__V1, (__v16qi)__V2, in _mm_blendv_epi8() 109 (__m128i)__builtin_shufflevector((__v8hi)(__m128i)(V1), \ 110 (__v8hi)(__m128i)(V2), \ 121 static __inline__ __m128i __DEFAULT_FN_ATTRS 122 _mm_mullo_epi32 (__m128i __V1, __m128i __V2) in _mm_mullo_epi32() 124 return (__m128i) ((__v4si)__V1 * (__v4si)__V2); in _mm_mullo_epi32() 127 static __inline__ __m128i __DEFAULT_FN_ATTRS 128 _mm_mul_epi32 (__m128i __V1, __m128i __V2) in _mm_mul_epi32() [all …]
|
D | avx512vlbwintrin.h | 37 _mm_cmpeq_epi8_mask(__m128i __a, __m128i __b) { in _mm_cmpeq_epi8_mask() 43 _mm_mask_cmpeq_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) { in _mm_mask_cmpeq_epi8_mask() 49 _mm_cmpeq_epu8_mask(__m128i __a, __m128i __b) { in _mm_cmpeq_epu8_mask() 55 _mm_mask_cmpeq_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) { in _mm_mask_cmpeq_epu8_mask() 85 _mm_cmpeq_epi16_mask(__m128i __a, __m128i __b) { in _mm_cmpeq_epi16_mask() 91 _mm_mask_cmpeq_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) { in _mm_mask_cmpeq_epi16_mask() 97 _mm_cmpeq_epu16_mask(__m128i __a, __m128i __b) { in _mm_cmpeq_epu16_mask() 103 _mm_mask_cmpeq_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) { in _mm_mask_cmpeq_epu16_mask() 133 _mm_cmpge_epi8_mask(__m128i __a, __m128i __b) { in _mm_cmpge_epi8_mask() 139 _mm_mask_cmpge_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) { in _mm_mask_cmpge_epi8_mask() [all …]
|
/external/clang/test/CodeGen/ |
D | xop-builtins.c | 8 __m128i test_mm_maccs_epi16(__m128i a, __m128i b, __m128i c) { in test_mm_maccs_epi16() 14 __m128i test_mm_macc_epi16(__m128i a, __m128i b, __m128i c) { in test_mm_macc_epi16() 20 __m128i test_mm_maccsd_epi16(__m128i a, __m128i b, __m128i c) { in test_mm_maccsd_epi16() 26 __m128i test_mm_maccd_epi16(__m128i a, __m128i b, __m128i c) { in test_mm_maccd_epi16() 32 __m128i test_mm_maccs_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_maccs_epi32() 38 __m128i test_mm_macc_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_macc_epi32() 44 __m128i test_mm_maccslo_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_maccslo_epi32() 50 __m128i test_mm_macclo_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_macclo_epi32() 56 __m128i test_mm_maccshi_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_maccshi_epi32() 62 __m128i test_mm_macchi_epi32(__m128i a, __m128i b, __m128i c) { in test_mm_macchi_epi32() [all …]
|
D | sse2-builtins.c | 9 __m128i test_mm_add_epi8(__m128i A, __m128i B) { in test_mm_add_epi8() 15 __m128i test_mm_add_epi16(__m128i A, __m128i B) { in test_mm_add_epi16() 21 __m128i test_mm_add_epi32(__m128i A, __m128i B) { in test_mm_add_epi32() 27 __m128i test_mm_add_epi64(__m128i A, __m128i B) { in test_mm_add_epi64() 45 __m128i test_mm_adds_epi8(__m128i A, __m128i B) { in test_mm_adds_epi8() 51 __m128i test_mm_adds_epi16(__m128i A, __m128i B) { in test_mm_adds_epi16() 57 __m128i test_mm_adds_epu8(__m128i A, __m128i B) { in test_mm_adds_epu8() 63 __m128i test_mm_adds_epu16(__m128i A, __m128i B) { in test_mm_adds_epu16() 75 __m128i test_mm_and_si128(__m128i A, __m128i B) { in test_mm_and_si128() 81 __m128i test_mm_avg_epu8(__m128i A, __m128i B) { in test_mm_avg_epu8() [all …]
|
D | sse41-builtins.c | 9 __m128i test_mm_blend_epi16(__m128i V1, __m128i V2) { in test_mm_blend_epi16() 27 __m128i test_mm_blendv_epi8(__m128i V1, __m128i V2, __m128i V3) { in test_mm_blendv_epi8() 69 __m128i test_mm_cmpeq_epi64(__m128i A, __m128i B) { in test_mm_cmpeq_epi64() 75 __m128i test_mm_cvtepi8_epi16(__m128i a) { in test_mm_cvtepi8_epi16() 81 __m128i test_mm_cvtepi8_epi32(__m128i a) { in test_mm_cvtepi8_epi32() 87 __m128i test_mm_cvtepi8_epi64(__m128i a) { in test_mm_cvtepi8_epi64() 93 __m128i test_mm_cvtepi16_epi32(__m128i a) { in test_mm_cvtepi16_epi32() 99 __m128i test_mm_cvtepi16_epi64(__m128i a) { in test_mm_cvtepi16_epi64() 105 __m128i test_mm_cvtepi32_epi64(__m128i a) { in test_mm_cvtepi32_epi64() 111 __m128i test_mm_cvtepu8_epi16(__m128i a) { in test_mm_cvtepu8_epi16() [all …]
|
D | ssse3-builtins.c | 8 __m128i test_mm_abs_epi8(__m128i a) { in test_mm_abs_epi8() 14 __m128i test_mm_abs_epi16(__m128i a) { in test_mm_abs_epi16() 20 __m128i test_mm_abs_epi32(__m128i a) { in test_mm_abs_epi32() 26 __m128i test_mm_alignr_epi8(__m128i a, __m128i b) { in test_mm_alignr_epi8() 32 __m128i test2_mm_alignr_epi8(__m128i a, __m128i b) { in test2_mm_alignr_epi8() 38 __m128i test_mm_hadd_epi16(__m128i a, __m128i b) { in test_mm_hadd_epi16() 44 __m128i test_mm_hadd_epi32(__m128i a, __m128i b) { in test_mm_hadd_epi32() 50 __m128i test_mm_hadds_epi16(__m128i a, __m128i b) { in test_mm_hadds_epi16() 56 __m128i test_mm_hsub_epi16(__m128i a, __m128i b) { in test_mm_hsub_epi16() 62 __m128i test_mm_hsub_epi32(__m128i a, __m128i b) { in test_mm_hsub_epi32() [all …]
|
D | avx512vlbw-builtins.c | 21 __mmask16 test_mm_cmpeq_epi8_mask(__m128i __a, __m128i __b) { in test_mm_cmpeq_epi8_mask() 27 __mmask16 test_mm_mask_cmpeq_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) { in test_mm_mask_cmpeq_epi8_mask() 45 __mmask8 test_mm_cmpeq_epi16_mask(__m128i __a, __m128i __b) { in test_mm_cmpeq_epi16_mask() 51 __mmask8 test_mm_mask_cmpeq_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) { in test_mm_mask_cmpeq_epi16_mask() 69 __mmask16 test_mm_cmpgt_epi8_mask(__m128i __a, __m128i __b) { in test_mm_cmpgt_epi8_mask() 75 __mmask16 test_mm_mask_cmpgt_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) { in test_mm_mask_cmpgt_epi8_mask() 93 __mmask8 test_mm_cmpgt_epi16_mask(__m128i __a, __m128i __b) { in test_mm_cmpgt_epi16_mask() 99 __mmask8 test_mm_mask_cmpgt_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) { in test_mm_mask_cmpgt_epi16_mask() 105 __mmask16 test_mm_cmpeq_epu8_mask(__m128i __a, __m128i __b) { in test_mm_cmpeq_epu8_mask() 111 __mmask16 test_mm_mask_cmpeq_epu8_mask(__mmask64 __u, __m128i __a, __m128i __b) { in test_mm_mask_cmpeq_epu8_mask() [all …]
|
D | sse42-builtins.c | 9 __m128i test_mm_cmpgt_epi8(__m128i A, __m128i B) { in test_mm_cmpgt_epi8() 15 __m128i test_mm_cmpgt_epi16(__m128i A, __m128i B) { in test_mm_cmpgt_epi16() 21 __m128i test_mm_cmpgt_epi32(__m128i A, __m128i B) { in test_mm_cmpgt_epi32() 27 __m128i test_mm_cmpgt_epi64(__m128i A, __m128i B) { in test_mm_cmpgt_epi64() 33 int test_mm_cmpestra(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestra() 39 int test_mm_cmpestrc(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestrc() 45 int test_mm_cmpestri(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestri() 51 __m128i test_mm_cmpestrm(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestrm() 57 int test_mm_cmpestro(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestro() 63 int test_mm_cmpestrs(__m128i A, int LA, __m128i B, int LB) { in test_mm_cmpestrs() [all …]
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | fwd_txfm_sse2.h | 21 static INLINE __m128i k_madd_epi32(__m128i a, __m128i b) { in k_madd_epi32() 22 __m128i buf0, buf1; in k_madd_epi32() 30 static INLINE __m128i k_packs_epi64(__m128i a, __m128i b) { in k_packs_epi64() 31 __m128i buf0 = _mm_shuffle_epi32(a, _MM_SHUFFLE(0, 0, 2, 0)); in k_packs_epi64() 32 __m128i buf1 = _mm_shuffle_epi32(b, _MM_SHUFFLE(0, 0, 2, 0)); in k_packs_epi64() 36 static INLINE int check_epi16_overflow_x2(const __m128i *preg0, in check_epi16_overflow_x2() 37 const __m128i *preg1) { in check_epi16_overflow_x2() 38 const __m128i max_overflow = _mm_set1_epi16(0x7fff); in check_epi16_overflow_x2() 39 const __m128i min_overflow = _mm_set1_epi16(0x8000); in check_epi16_overflow_x2() 40 __m128i cmp0 = _mm_or_si128(_mm_cmpeq_epi16(*preg0, max_overflow), in check_epi16_overflow_x2() [all …]
|
D | fwd_txfm_impl_sse2.h | 46 const __m128i k__cospi_A = octa_set_epi16(cospi_16_64, cospi_16_64, in FDCT4x4_2D() 50 const __m128i k__cospi_B = octa_set_epi16(cospi_16_64, -cospi_16_64, in FDCT4x4_2D() 54 const __m128i k__cospi_C = octa_set_epi16(cospi_8_64, cospi_24_64, in FDCT4x4_2D() 58 const __m128i k__cospi_D = octa_set_epi16(cospi_24_64, -cospi_8_64, in FDCT4x4_2D() 62 const __m128i k__cospi_E = octa_set_epi16(cospi_16_64, cospi_16_64, in FDCT4x4_2D() 66 const __m128i k__cospi_F = octa_set_epi16(cospi_16_64, -cospi_16_64, in FDCT4x4_2D() 70 const __m128i k__cospi_G = octa_set_epi16(cospi_8_64, cospi_24_64, in FDCT4x4_2D() 74 const __m128i k__cospi_H = octa_set_epi16(cospi_24_64, -cospi_8_64, in FDCT4x4_2D() 79 const __m128i k__DCT_CONST_ROUNDING = _mm_set1_epi32(DCT_CONST_ROUNDING); in FDCT4x4_2D() 81 const __m128i k__DCT_CONST_ROUNDING2 = _mm_set1_epi32(DCT_CONST_ROUNDING in FDCT4x4_2D() [all …]
|
D | vpx_subpixel_8t_intrin_ssse3.c | 61 __m128i firstFilters, secondFilters, shuffle1, shuffle2; in vpx_filter_block1d4_h8_intrin_ssse3() 62 __m128i srcRegFilt1, srcRegFilt2, srcRegFilt3, srcRegFilt4; in vpx_filter_block1d4_h8_intrin_ssse3() 63 __m128i addFilterReg64, filtersReg, srcReg, minReg; in vpx_filter_block1d4_h8_intrin_ssse3() 68 filtersReg = _mm_loadu_si128((const __m128i *)filter); in vpx_filter_block1d4_h8_intrin_ssse3() 85 shuffle1 =_mm_load_si128((__m128i const *)filt1_4_h8); in vpx_filter_block1d4_h8_intrin_ssse3() 86 shuffle2 = _mm_load_si128((__m128i const *)filt2_4_h8); in vpx_filter_block1d4_h8_intrin_ssse3() 89 srcReg = _mm_loadu_si128((const __m128i *)(src_ptr - 3)); in vpx_filter_block1d4_h8_intrin_ssse3() 132 __m128i firstFilters, secondFilters, thirdFilters, forthFilters, srcReg; in vpx_filter_block1d8_h8_intrin_ssse3() 133 __m128i filt1Reg, filt2Reg, filt3Reg, filt4Reg; in vpx_filter_block1d8_h8_intrin_ssse3() 134 __m128i srcRegFilt1, srcRegFilt2, srcRegFilt3, srcRegFilt4; in vpx_filter_block1d8_h8_intrin_ssse3() [all …]
|
/external/opencv3/3rdparty/libwebp/dsp/ |
D | enc_sse2.c | 31 static void PrintReg(const __m128i r, const char* const name, int size) { 34 __m128i r; 62 const __m128i max_coeff_thresh = _mm_set1_epi16(MAX_COEFF_THRESH); in CollectHistogramSSE2() 73 const __m128i out0 = _mm_loadu_si128((__m128i*)&out[0]); in CollectHistogramSSE2() 74 const __m128i out1 = _mm_loadu_si128((__m128i*)&out[8]); in CollectHistogramSSE2() 76 const __m128i sign0 = _mm_srai_epi16(out0, 15); in CollectHistogramSSE2() 77 const __m128i sign1 = _mm_srai_epi16(out1, 15); in CollectHistogramSSE2() 79 const __m128i xor0 = _mm_xor_si128(out0, sign0); in CollectHistogramSSE2() 80 const __m128i xor1 = _mm_xor_si128(out1, sign1); in CollectHistogramSSE2() 81 const __m128i abs0 = _mm_sub_epi16(xor0, sign0); in CollectHistogramSSE2() [all …]
|
/external/webp/src/dsp/ |
D | enc_sse2.c | 28 static void PrintReg(const __m128i r, const char* const name, int size) { 31 __m128i r; 74 const __m128i k1 = _mm_set1_epi16(20091); in ITransform() 75 const __m128i k2 = _mm_set1_epi16(-30068); in ITransform() 76 __m128i T0, T1, T2, T3; in ITransform() 82 __m128i in0, in1, in2, in3; in ITransform() 84 in0 = _mm_loadl_epi64((const __m128i*)&in[0]); in ITransform() 85 in1 = _mm_loadl_epi64((const __m128i*)&in[4]); in ITransform() 86 in2 = _mm_loadl_epi64((const __m128i*)&in[8]); in ITransform() 87 in3 = _mm_loadl_epi64((const __m128i*)&in[12]); in ITransform() [all …]
|
D | lossless_sse2.c | 26 const __m128i zero = _mm_setzero_si128(); in ClampedAddSubtractFull() 27 const __m128i C0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c0), zero); in ClampedAddSubtractFull() 28 const __m128i C1 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c1), zero); in ClampedAddSubtractFull() 29 const __m128i C2 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c2), zero); in ClampedAddSubtractFull() 30 const __m128i V1 = _mm_add_epi16(C0, C1); in ClampedAddSubtractFull() 31 const __m128i V2 = _mm_sub_epi16(V1, C2); in ClampedAddSubtractFull() 32 const __m128i b = _mm_packus_epi16(V2, V2); in ClampedAddSubtractFull() 39 const __m128i zero = _mm_setzero_si128(); in ClampedAddSubtractHalf() 40 const __m128i C0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c0), zero); in ClampedAddSubtractHalf() 41 const __m128i C1 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c1), zero); in ClampedAddSubtractHalf() [all …]
|
D | enc_sse41.c | 28 const __m128i max_coeff_thresh = _mm_set1_epi16(MAX_COEFF_THRESH); in CollectHistogram() 40 const __m128i out0 = _mm_loadu_si128((__m128i*)&out[0]); in CollectHistogram() 41 const __m128i out1 = _mm_loadu_si128((__m128i*)&out[8]); in CollectHistogram() 43 const __m128i abs0 = _mm_abs_epi16(out0); in CollectHistogram() 44 const __m128i abs1 = _mm_abs_epi16(out1); in CollectHistogram() 45 const __m128i v0 = _mm_srai_epi16(abs0, 3); in CollectHistogram() 46 const __m128i v1 = _mm_srai_epi16(abs1, 3); in CollectHistogram() 48 const __m128i bin0 = _mm_min_epi16(v0, max_coeff_thresh); in CollectHistogram() 49 const __m128i bin1 = _mm_min_epi16(v1, max_coeff_thresh); in CollectHistogram() 51 _mm_storeu_si128((__m128i*)&out[0], bin0); in CollectHistogram() [all …]
|
D | alpha_processing_sse2.c | 28 const __m128i zero = _mm_setzero_si128(); in DispatchAlpha() 29 const __m128i rgb_mask = _mm_set1_epi32(0xffffff00u); // to preserve RGB in DispatchAlpha() 30 const __m128i all_0xff = _mm_set_epi32(0, 0, ~0u, ~0u); in DispatchAlpha() 31 __m128i all_alphas = all_0xff; in DispatchAlpha() 39 __m128i* out = (__m128i*)dst; in DispatchAlpha() 42 const __m128i a0 = _mm_loadl_epi64((const __m128i*)&alpha[i]); in DispatchAlpha() 43 const __m128i a1 = _mm_unpacklo_epi8(a0, zero); in DispatchAlpha() 44 const __m128i a2_lo = _mm_unpacklo_epi16(a1, zero); in DispatchAlpha() 45 const __m128i a2_hi = _mm_unpackhi_epi16(a1, zero); in DispatchAlpha() 47 const __m128i b0_lo = _mm_loadu_si128(out + 0); in DispatchAlpha() [all …]
|
D | dec_sse2.c | 46 const __m128i k1 = _mm_set1_epi16(20091); in Transform() 47 const __m128i k2 = _mm_set1_epi16(-30068); in Transform() 48 __m128i T0, T1, T2, T3; in Transform() 53 __m128i in0, in1, in2, in3; in Transform() 55 in0 = _mm_loadl_epi64((const __m128i*)&in[0]); in Transform() 56 in1 = _mm_loadl_epi64((const __m128i*)&in[4]); in Transform() 57 in2 = _mm_loadl_epi64((const __m128i*)&in[8]); in Transform() 58 in3 = _mm_loadl_epi64((const __m128i*)&in[12]); in Transform() 64 const __m128i inB0 = _mm_loadl_epi64((const __m128i*)&in[16]); in Transform() 65 const __m128i inB1 = _mm_loadl_epi64((const __m128i*)&in[20]); in Transform() [all …]
|
D | lossless_enc_sse2.c | 30 const __m128i in = _mm_loadu_si128((__m128i*)&argb_data[i]); // argb in SubtractGreenFromBlueAndRed() 31 const __m128i A = _mm_srli_epi16(in, 8); // 0 a 0 g in SubtractGreenFromBlueAndRed() 32 const __m128i B = _mm_shufflelo_epi16(A, _MM_SHUFFLE(2, 2, 0, 0)); in SubtractGreenFromBlueAndRed() 33 const __m128i C = _mm_shufflehi_epi16(B, _MM_SHUFFLE(2, 2, 0, 0)); // 0g0g in SubtractGreenFromBlueAndRed() 34 const __m128i out = _mm_sub_epi8(in, C); in SubtractGreenFromBlueAndRed() 35 _mm_storeu_si128((__m128i*)&argb_data[i], out); in SubtractGreenFromBlueAndRed() 46 const __m128i mults_rb = _mm_set_epi16( in TransformColor() 51 const __m128i mults_b2 = _mm_set_epi16( in TransformColor() 54 const __m128i mask_ag = _mm_set1_epi32(0xff00ff00); // alpha-green masks in TransformColor() 55 const __m128i mask_rb = _mm_set1_epi32(0x00ff00ff); // red-blue masks in TransformColor() [all …]
|
/external/skia/src/opts/ |
D | SkColor_opts_SSE2.h | 19 static inline __m128i Multiply32_SSE2(const __m128i& a, const __m128i& b) { in Multiply32_SSE2() 21 __m128i r1 = _mm_mul_epu32(a, b); in Multiply32_SSE2() 23 __m128i r2 = _mm_mul_epu32(_mm_srli_si128(a, 4), _mm_srli_si128(b, 4)); in Multiply32_SSE2() 25 __m128i r = _mm_unpacklo_epi32(_mm_shuffle_epi32(r1, _MM_SHUFFLE(0,0,2,0)), in Multiply32_SSE2() 30 static inline __m128i SkAlpha255To256_SSE2(const __m128i& alpha) { in SkAlpha255To256_SSE2() 35 static inline __m128i SkAlphaMulAlpha_SSE2(const __m128i& a, in SkAlphaMulAlpha_SSE2() 36 const __m128i& b) { in SkAlphaMulAlpha_SSE2() 37 __m128i prod = _mm_mullo_epi16(a, b); in SkAlphaMulAlpha_SSE2() 46 static inline __m128i SkAlphaMulQ_SSE2(const __m128i& c, const __m128i& scale) { in SkAlphaMulQ_SSE2() 47 const __m128i mask = _mm_set1_epi32(0xFF00FF); in SkAlphaMulQ_SSE2() [all …]
|
/external/libmpeg2/common/x86/ |
D | impeg2_inter_pred_sse42_intr.c | 76 __m128i src_r0, src_r1, src_r2, src_r3; in impeg2_copy_mb_sse42() 84 src_r0 = _mm_loadu_si128((__m128i *) (src)); in impeg2_copy_mb_sse42() 85 src_r1 = _mm_loadu_si128((__m128i *) (src + src_wd)); in impeg2_copy_mb_sse42() 86 src_r2 = _mm_loadu_si128((__m128i *) (src + 2 * src_wd)); in impeg2_copy_mb_sse42() 87 src_r3 = _mm_loadu_si128((__m128i *) (src + 3 * src_wd)); in impeg2_copy_mb_sse42() 89 _mm_storeu_si128((__m128i *) dst, src_r0); in impeg2_copy_mb_sse42() 90 _mm_storeu_si128((__m128i *) (dst + dst_wd), src_r1); in impeg2_copy_mb_sse42() 91 _mm_storeu_si128((__m128i *) (dst + 2 * dst_wd), src_r2); in impeg2_copy_mb_sse42() 92 _mm_storeu_si128((__m128i *) (dst + 3 * dst_wd), src_r3); in impeg2_copy_mb_sse42() 97 src_r0 = _mm_loadu_si128((__m128i *) (src)); in impeg2_copy_mb_sse42() [all …]
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_dct_ssse3.c | 33 __m128i zero; in vp9_fdct8x8_quant_ssse3() 39 const __m128i k__dual_p16_p16 = dual_set_epi16(23170, 23170); in vp9_fdct8x8_quant_ssse3() 40 const __m128i k__cospi_p16_p16 = _mm_set1_epi16((int16_t)cospi_16_64); in vp9_fdct8x8_quant_ssse3() 41 const __m128i k__cospi_p16_m16 = pair_set_epi16(cospi_16_64, -cospi_16_64); in vp9_fdct8x8_quant_ssse3() 42 const __m128i k__cospi_p24_p08 = pair_set_epi16(cospi_24_64, cospi_8_64); in vp9_fdct8x8_quant_ssse3() 43 const __m128i k__cospi_m08_p24 = pair_set_epi16(-cospi_8_64, cospi_24_64); in vp9_fdct8x8_quant_ssse3() 44 const __m128i k__cospi_p28_p04 = pair_set_epi16(cospi_28_64, cospi_4_64); in vp9_fdct8x8_quant_ssse3() 45 const __m128i k__cospi_m04_p28 = pair_set_epi16(-cospi_4_64, cospi_28_64); in vp9_fdct8x8_quant_ssse3() 46 const __m128i k__cospi_p12_p20 = pair_set_epi16(cospi_12_64, cospi_20_64); in vp9_fdct8x8_quant_ssse3() 47 const __m128i k__cospi_m20_p12 = pair_set_epi16(-cospi_20_64, cospi_12_64); in vp9_fdct8x8_quant_ssse3() [all …]
|
/external/opencv3/modules/core/include/opencv2/core/ |
D | sse_utils.hpp | 51 inline void _mm_deinterleave_epi8(__m128i & v_r0, __m128i & v_r1, __m128i & v_g0, __m128i & v_g1) in _mm_deinterleave_epi8() 53 __m128i layer1_chunk0 = _mm_unpacklo_epi8(v_r0, v_g0); in _mm_deinterleave_epi8() 54 __m128i layer1_chunk1 = _mm_unpackhi_epi8(v_r0, v_g0); in _mm_deinterleave_epi8() 55 __m128i layer1_chunk2 = _mm_unpacklo_epi8(v_r1, v_g1); in _mm_deinterleave_epi8() 56 __m128i layer1_chunk3 = _mm_unpackhi_epi8(v_r1, v_g1); in _mm_deinterleave_epi8() 58 __m128i layer2_chunk0 = _mm_unpacklo_epi8(layer1_chunk0, layer1_chunk2); in _mm_deinterleave_epi8() 59 __m128i layer2_chunk1 = _mm_unpackhi_epi8(layer1_chunk0, layer1_chunk2); in _mm_deinterleave_epi8() 60 __m128i layer2_chunk2 = _mm_unpacklo_epi8(layer1_chunk1, layer1_chunk3); in _mm_deinterleave_epi8() 61 __m128i layer2_chunk3 = _mm_unpackhi_epi8(layer1_chunk1, layer1_chunk3); in _mm_deinterleave_epi8() 63 __m128i layer3_chunk0 = _mm_unpacklo_epi8(layer2_chunk0, layer2_chunk2); in _mm_deinterleave_epi8() [all …]
|
/external/libvpx/libvpx/vp8/encoder/x86/ |
D | denoising_sse2.c | 21 static INLINE unsigned int abs_sum_diff_16x1(__m128i acc_diff) { in abs_sum_diff_16x1() 22 const __m128i k_1 = _mm_set1_epi16(1); in abs_sum_diff_16x1() 23 const __m128i acc_diff_lo = _mm_srai_epi16( in abs_sum_diff_16x1() 25 const __m128i acc_diff_hi = _mm_srai_epi16( in abs_sum_diff_16x1() 27 const __m128i acc_diff_16 = _mm_add_epi16(acc_diff_lo, acc_diff_hi); in abs_sum_diff_16x1() 28 const __m128i hg_fe_dc_ba = _mm_madd_epi16(acc_diff_16, k_1); in abs_sum_diff_16x1() 29 const __m128i hgfe_dcba = _mm_add_epi32(hg_fe_dc_ba, in abs_sum_diff_16x1() 31 const __m128i hgfedcba = _mm_add_epi32(hgfe_dcba, in abs_sum_diff_16x1() 51 __m128i acc_diff = _mm_setzero_si128(); in vp8_denoiser_filter_sse2() 52 const __m128i k_0 = _mm_setzero_si128(); in vp8_denoiser_filter_sse2() [all …]
|