/external/libavc/common/x86/ |
D | ih264_ihadamard_scaling_ssse3.c | 97 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_ihadamard_scaling_4x4_ssse3() local 111 src_r1 = _mm_unpackhi_epi16(src_r0_r1, sign_reg); in ih264_ihadamard_scaling_4x4_ssse3() 127 temp0 = _mm_unpacklo_epi32(src_r0, src_r1); //a0 b0 a1 b1 in ih264_ihadamard_scaling_4x4_ssse3() 129 temp1 = _mm_unpackhi_epi32(src_r0, src_r1); //a2 b2 a3 b3 in ih264_ihadamard_scaling_4x4_ssse3() 132 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //a1 b1 c1 d1 in ih264_ihadamard_scaling_4x4_ssse3() 137 temp1 = _mm_add_epi32(src_r1, src_r2); in ih264_ihadamard_scaling_4x4_ssse3() 138 temp2 = _mm_sub_epi32(src_r1, src_r2); in ih264_ihadamard_scaling_4x4_ssse3() 142 src_r1 = _mm_add_epi32(temp2, temp3); in ih264_ihadamard_scaling_4x4_ssse3() 156 temp0 = _mm_unpacklo_epi32(src_r0, src_r1); //a0 a1 b0 b1 in ih264_ihadamard_scaling_4x4_ssse3() 158 temp1 = _mm_unpackhi_epi32(src_r0, src_r1); //c0 c1 d0 d1 in ih264_ihadamard_scaling_4x4_ssse3() [all …]
|
D | ih264_resi_trans_quant_sse42.c | 118 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_resi_trans_quant_4x4_sse42() local 130 …src_r1 = _mm_loadl_epi64((__m128i *) (&pu1_src[src_strd])); //a10 a11 a12 a13 0 0 0 0 0 0 0 0 -- a… in ih264_resi_trans_quant_4x4_sse42() 135 src_r1 = _mm_cvtepu8_epi16(src_r1); in ih264_resi_trans_quant_4x4_sse42() 150 src_r1 = _mm_sub_epi16(src_r1, pred_r1); in ih264_resi_trans_quant_4x4_sse42() 165 temp0 = _mm_unpacklo_epi16(src_r0, src_r1); //a0 b0 a1 b1 a2 b2 a3 b3 in ih264_resi_trans_quant_4x4_sse42() 171 src_r1 = _mm_unpackhi_epi64(temp1, zero_8x16b); //a1 b1 c1 d1 in ih264_resi_trans_quant_4x4_sse42() 179 temp1 = _mm_add_epi16(src_r1, src_r2); in ih264_resi_trans_quant_4x4_sse42() 181 temp2 = _mm_sub_epi16(src_r1, src_r2); in ih264_resi_trans_quant_4x4_sse42() 188 src_r1 = _mm_slli_epi16(temp3, 1); //(x3<<1) in ih264_resi_trans_quant_4x4_sse42() 189 src_r1 = _mm_add_epi16(src_r1, temp2); in ih264_resi_trans_quant_4x4_sse42() [all …]
|
D | ih264_ihadamard_scaling_sse42.c | 97 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_ihadamard_scaling_4x4_sse42() local 108 src_r1 = _mm_cvtepi16_epi32(src_r0_r1); in ih264_ihadamard_scaling_4x4_sse42() 125 temp0 = _mm_unpacklo_epi32(src_r0, src_r1); //a0 b0 a1 b1 in ih264_ihadamard_scaling_4x4_sse42() 127 temp1 = _mm_unpackhi_epi32(src_r0, src_r1); //a2 b2 a3 b3 in ih264_ihadamard_scaling_4x4_sse42() 130 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //a1 b1 c1 d1 in ih264_ihadamard_scaling_4x4_sse42() 135 temp1 = _mm_add_epi32(src_r1, src_r2); in ih264_ihadamard_scaling_4x4_sse42() 136 temp2 = _mm_sub_epi32(src_r1, src_r2); in ih264_ihadamard_scaling_4x4_sse42() 140 src_r1 = _mm_add_epi32(temp2, temp3); in ih264_ihadamard_scaling_4x4_sse42() 154 temp0 = _mm_unpacklo_epi32(src_r0, src_r1); //a0 a1 b0 b1 in ih264_ihadamard_scaling_4x4_sse42() 156 temp1 = _mm_unpackhi_epi32(src_r0, src_r1); //c0 c1 d0 d1 in ih264_ihadamard_scaling_4x4_sse42() [all …]
|
D | ih264_iquant_itrans_recon_sse42.c | 114 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_iquant_itrans_recon_4x4_sse42() local 145 src_r1 = _mm_unpackhi_epi16(src_r0_r1, zero_8x16b); // a10 0 a11 0 a12 0 a13 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_sse42() 150 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_4x4_sse42() 363 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_iquant_itrans_recon_chroma_4x4_sse42() local 396 src_r1 = _mm_unpackhi_epi16(src_r0_r1, zero_8x16b); // a10 0 a11 0 a12 0 a13 0 -- 16 bit long in ih264_iquant_itrans_recon_chroma_4x4_sse42() 401 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_chroma_4x4_sse42()
|
D | ih264_iquant_itrans_recon_ssse3.c | 114 __m128i src_r0, src_r1, src_r2, src_r3; in ih264_iquant_itrans_recon_4x4_ssse3() local 146 src_r1 = _mm_unpackhi_epi16(src_r0_r1, zero_8x16b); // a10 0 a11 0 a12 0 a13 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_ssse3() 151 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_4x4_ssse3()
|
/external/libmpeg2/common/x86/ |
D | impeg2_inter_pred_sse42_intr.c | 76 __m128i src_r0, src_r1, src_r2, src_r3; in impeg2_copy_mb_sse42() local 85 src_r1 = _mm_loadu_si128((__m128i *) (src + src_wd)); in impeg2_copy_mb_sse42() 90 _mm_storeu_si128((__m128i *) (dst + dst_wd), src_r1); in impeg2_copy_mb_sse42() 98 src_r1 = _mm_loadu_si128((__m128i *) (src + src_wd)); in impeg2_copy_mb_sse42() 103 _mm_storeu_si128((__m128i *) (dst + dst_wd), src_r1); in impeg2_copy_mb_sse42() 111 src_r1 = _mm_loadu_si128((__m128i *) (src + src_wd)); in impeg2_copy_mb_sse42() 116 _mm_storeu_si128((__m128i *) (dst + dst_wd), src_r1); in impeg2_copy_mb_sse42() 124 src_r1 = _mm_loadu_si128((__m128i *) (src + src_wd)); in impeg2_copy_mb_sse42() 129 _mm_storeu_si128((__m128i *) (dst + dst_wd), src_r1); in impeg2_copy_mb_sse42() 144 src_r1 = _mm_loadl_epi64((__m128i *)(src + src_wd)); in impeg2_copy_mb_sse42() [all …]
|
D | icv_variance_ssse3.c | 90 __m128 src_r0, src_r1; in icv_variance_8x4_ssse3() local 113 src_r1 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src)); in icv_variance_8x4_ssse3() 119 src_r1 = _mm_loadh_pi (src_r1, (__m64 *) (pu1_src)); in icv_variance_8x4_ssse3() 125 sum_r1 = _mm_sad_epu8((__m128i)src_r1, zero); in icv_variance_8x4_ssse3() 135 ssrc_r1 = _mm_unpacklo_epi8((__m128i)src_r1, zero); in icv_variance_8x4_ssse3() 137 ssrc_r3 = _mm_unpackhi_epi8((__m128i)src_r1, zero); in icv_variance_8x4_ssse3()
|
D | icv_sad_ssse3.c | 98 __m128 src_r0, src_r1; in icv_sad_8x4_ssse3() local 111 src_r1 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src)); in icv_sad_8x4_ssse3() 117 src_r1 = _mm_loadh_pi (src_r1, (__m64 *) (pu1_src)); in icv_sad_8x4_ssse3() 136 res_r1 = _mm_sad_epu8((__m128i)src_r1, (__m128i)ref_r1); in icv_sad_8x4_ssse3()
|
/external/libavc/encoder/x86/ |
D | ime_distortion_metrics_sse42.c | 108 __m128i src_r0, src_r1, src_r2, src_r3; in ime_compute_sad_16x16_sse42() local 117 src_r1 = _mm_loadu_si128((__m128i *) (pu1_src + src_strd)); in ime_compute_sad_16x16_sse42() 127 res_r1 = _mm_sad_epu8(src_r1, est_r1); in ime_compute_sad_16x16_sse42() 140 src_r1 = _mm_loadu_si128((__m128i *) (pu1_src + src_strd)); in ime_compute_sad_16x16_sse42() 150 res_r1 = _mm_sad_epu8(src_r1, est_r1); in ime_compute_sad_16x16_sse42() 163 src_r1 = _mm_loadu_si128((__m128i *) (pu1_src + src_strd)); in ime_compute_sad_16x16_sse42() 173 res_r1 = _mm_sad_epu8(src_r1, est_r1); in ime_compute_sad_16x16_sse42() 186 src_r1 = _mm_loadu_si128((__m128i *) (pu1_src + src_strd)); in ime_compute_sad_16x16_sse42() 196 res_r1 = _mm_sad_epu8(src_r1, est_r1); in ime_compute_sad_16x16_sse42() 252 __m128i src_r0, src_r1, src_r2, src_r3; in ime_compute_sad_16x8_sse42() local [all …]
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/ |
D | format_utils.h | 452 simd4scalar src_r1 = SIMD128::load_ps(pfSrc + 4); in Transpose() local 458 simd4scalar dst2 = SIMD128::unpacklo_ps(src_r1, src_g1); in Transpose() 459 simd4scalar dst3 = SIMD128::unpackhi_ps(src_r1, src_g1); in Transpose()
|