/external/libavc/common/x86/ |
D | ih264_luma_intra_pred_filters_ssse3.c | 342 top_sh_8x16b = _mm_srli_si128(top_8x16b, 2); //t1 t2 t3 t4 t5 t6 t7 0 in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 347 res2_8x16b = _mm_srli_si128(res1_8x16b, 2); in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 358 res_16x8b = _mm_srli_si128(res_16x8b, 1); in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 360 res_16x8b = _mm_srli_si128(res_16x8b, 1); in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 362 res_16x8b = _mm_srli_si128(res_16x8b, 1); in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 426 …top_left_sh_16x8b = _mm_srli_si128(top_left_16x8b, 1); //l2 l1 l0 tl t0 t1 t2 t3… in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 433 …res2_8x16b = _mm_srli_si128(res1_8x16b, 2); //l2+l1 l1+l0 l0+tl tl+t0… in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 443 res2_16x8b = _mm_srli_si128(res1_16x8b, 3); in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 446 res2_16x8b = _mm_srli_si128(res1_16x8b, 2); in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 448 res2_16x8b = _mm_srli_si128(res1_16x8b, 1); in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() [all …]
|
D | ih264_inter_pred_filters_ssse3.c | 255 …src_r0_sht_16x8b = _mm_srli_si128(src_r0_16x8b, 1); //a1 a2 a3 a4 a5 a6 a7 a8 … in ih264_inter_pred_luma_horz_ssse3() 256 …src_r1_sht_16x8b = _mm_srli_si128(src_r1_16x8b, 1); //b1 b2 b3 b4 b5 b6 b7 b8 … in ih264_inter_pred_luma_horz_ssse3() 265 …src_r0_16x8b = _mm_srli_si128(src_r0_16x8b, 4); //a2 a3 a3 a4 a4 a5 a5 a6 … in ih264_inter_pred_luma_horz_ssse3() 266 …src_r1_16x8b = _mm_srli_si128(src_r1_16x8b, 4); //b2 b3 b3 b4 b4 b5 b5 b6 … in ih264_inter_pred_luma_horz_ssse3() 272 …src_r0_16x8b = _mm_srli_si128(src_r0_16x8b, 4); //a4 a5 a5 a6 a6 a7 a7 a8 … in ih264_inter_pred_luma_horz_ssse3() 273 …src_r1_16x8b = _mm_srli_si128(src_r1_16x8b, 4); //b4 b5 b5 b6 b6 b7 b7 b8 … in ih264_inter_pred_luma_horz_ssse3() 295 res_r0r1_16x8b = _mm_srli_si128(res_r0r1_16x8b, 4); in ih264_inter_pred_luma_horz_ssse3() 320 …src_r0_sht_16x8b = _mm_srli_si128(src_r0_16x8b, 1); //a1 a2 a3 a4 a5 a6 a7 a8 a9… in ih264_inter_pred_luma_horz_ssse3() 321 …src_r1_sht_16x8b = _mm_srli_si128(src_r1_16x8b, 1); //b1 b2 b3 b4 b5 b6 b7 b8 b9… in ih264_inter_pred_luma_horz_ssse3() 331 …src_r0_16x8b = _mm_srli_si128(src_r0_16x8b, 2); //a2 a3 a4 a5 a6 a7 a8 a9...… in ih264_inter_pred_luma_horz_ssse3() [all …]
|
/external/flac/libFLAC/ |
D | fixed_intrin_sse2.c | 87 last_error = _mm_srli_si128(last_error, 4); // 0 le0 le1 le2 in FLAC__fixed_compute_best_predictor_intrin_sse2() 89 last_error = _mm_srli_si128(last_error, 4); // 0 0 le0 le1 in FLAC__fixed_compute_best_predictor_intrin_sse2() 91 last_error = _mm_srli_si128(last_error, 4); // 0 0 0 le0 in FLAC__fixed_compute_best_predictor_intrin_sse2() 94 …last_error = _mm_add_epi32(last_error, _mm_srli_si128(last_error, 8)); // le0 le1 le2+le0 le3+l… in FLAC__fixed_compute_best_predictor_intrin_sse2() 95 …last_error = _mm_add_epi32(last_error, _mm_srli_si128(last_error, 4)); // le0 le1+le0 le2+le0+le… in FLAC__fixed_compute_best_predictor_intrin_sse2() 99 last_error = _mm_srli_si128(err1, 4); // 0 e1 e2 e3 in FLAC__fixed_compute_best_predictor_intrin_sse2() 116 total_err1 = _mm_srli_si128(total_err1, 8); // 0 0 te1 te2 in FLAC__fixed_compute_best_predictor_intrin_sse2() 119 total_err2 = _mm_srli_si128(total_err2, 4); // 0 te1 te2 te3 in FLAC__fixed_compute_best_predictor_intrin_sse2() 120 total_err1 = _mm_srli_si128(total_err1, 4); // 0 0 0 te1 in FLAC__fixed_compute_best_predictor_intrin_sse2() 184 last_error = _mm_srli_si128(last_error, 4); // 0 le0 le1 le2 in FLAC__fixed_compute_best_predictor_wide_intrin_sse2() [all …]
|
D | fixed_intrin_ssse3.c | 87 last_error = _mm_srli_si128(last_error, 4); // 0 le0 le1 le2 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 89 last_error = _mm_srli_si128(last_error, 4); // 0 0 le0 le1 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 91 last_error = _mm_srli_si128(last_error, 4); // 0 0 0 le0 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 94 …last_error = _mm_add_epi32(last_error, _mm_srli_si128(last_error, 8)); // le0 le1 le2+le0 le3+l… in FLAC__fixed_compute_best_predictor_intrin_ssse3() 95 …last_error = _mm_add_epi32(last_error, _mm_srli_si128(last_error, 4)); // le0 le1+le0 le2+le0+le… in FLAC__fixed_compute_best_predictor_intrin_ssse3() 110 total_err1 = _mm_srli_si128(total_err1, 8); // 0 0 te1 te2 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 113 total_err2 = _mm_srli_si128(total_err2, 4); // 0 te1 te2 te3 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 114 total_err1 = _mm_srli_si128(total_err1, 4); // 0 0 0 te1 in FLAC__fixed_compute_best_predictor_intrin_ssse3() 178 last_error = _mm_srli_si128(last_error, 4); // 0 le0 le1 le2 in FLAC__fixed_compute_best_predictor_wide_intrin_ssse3() 180 last_error = _mm_srli_si128(last_error, 4); // 0 0 le0 le1 in FLAC__fixed_compute_best_predictor_wide_intrin_ssse3() [all …]
|
/external/libaom/libaom/aom_dsp/x86/ |
D | loopfilter_sse2.c | 56 _mm_srli_si128( in transpose_pq_14_sse2() 66 _mm_srli_si128(ww0, 12), in transpose_pq_14_sse2() 70 _mm_srli_si128( in transpose_pq_14_sse2() 80 _mm_srli_si128(ww1, 12), in transpose_pq_14_sse2() 157 filter = _mm_and_si128(_mm_srli_si128(work, 4), *hev); in filter4_sse2() 182 hev1 = _mm_srli_si128(filter2filter1, 8); in filter4_sse2() 209 filter = _mm_and_si128(_mm_srli_si128(work, 8), *hev); in filter4_dual_sse2() 256 q1q0 = _mm_srli_si128(p1p0, 8); in lpf_internal_4_sse2() 264 flat = _mm_max_epu8(flat, _mm_srli_si128(flat, 4)); in lpf_internal_4_sse2() 272 abs_p1q1 = _mm_srli_si128(abs_p1q1p0q0, 4); /* abs(p1 - q1) */ in lpf_internal_4_sse2() [all …]
|
D | aom_subpixel_8t_intrin_sse2.c | 46 __m128i ss_2 = _mm_srli_si128(srcReg32b1, 2); in aom_filter_block1d16_h4_sse2() 47 __m128i ss_4 = _mm_srli_si128(srcReg32b1, 4); in aom_filter_block1d16_h4_sse2() 54 __m128i ss_1 = _mm_srli_si128(srcReg32b1, 3); in aom_filter_block1d16_h4_sse2() 55 __m128i ss_3 = _mm_srli_si128(srcReg32b1, 5); in aom_filter_block1d16_h4_sse2() 70 ss_2 = _mm_srli_si128(srcReg32b2, 2); in aom_filter_block1d16_h4_sse2() 71 ss_4 = _mm_srli_si128(srcReg32b2, 4); in aom_filter_block1d16_h4_sse2() 78 ss_1 = _mm_srli_si128(srcReg32b2, 3); in aom_filter_block1d16_h4_sse2() 79 ss_3 = _mm_srli_si128(srcReg32b2, 5); in aom_filter_block1d16_h4_sse2() 284 __m128i ss_2 = _mm_srli_si128(srcReg32b1, 2); in aom_filter_block1d8_h4_sse2() 285 __m128i ss_4 = _mm_srli_si128(srcReg32b1, 4); in aom_filter_block1d8_h4_sse2() [all …]
|
D | lpf_common_sse2.h | 41 _mm_srli_si128(w2, 4)); // 01 11 21 31 41 51 xx xx in highbd_transpose6x6_sse2() 45 _mm_srli_si128(w2, 8)); // 02 12 22 32 42 52 xx xx in highbd_transpose6x6_sse2() 51 *d3 = _mm_unpackhi_epi64(ww0, _mm_srli_si128(w2, 4)); // 03 13 23 33 43 53 in highbd_transpose6x6_sse2() 241 *d1 = _mm_srli_si128(*d0, in transpose4x8_8x4_low_sse2() 243 *d2 = _mm_srli_si128(*d0, in transpose4x8_8x4_low_sse2() 245 *d3 = _mm_srli_si128(*d0, in transpose4x8_8x4_low_sse2() 282 *d1 = _mm_srli_si128(ww0, in transpose4x8_8x4_sse2() 284 *d2 = _mm_srli_si128(ww0, in transpose4x8_8x4_sse2() 286 *d3 = _mm_srli_si128(ww0, in transpose4x8_8x4_sse2() 290 *d5 = _mm_srli_si128(ww1, in transpose4x8_8x4_sse2() [all …]
|
D | sse_sse4.c | 24 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum_all, 8)); in summary_all_sse4() 26 const __m128i sum_1x64 = _mm_add_epi64(sum_2x64, _mm_srli_si128(sum_2x64, 8)); in summary_all_sse4() 33 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum32, 8)); in summary_32_sse4() 43 const __m128i v_a01_w = _mm_cvtepu8_epi16(_mm_srli_si128(v_a0, 8)); in sse_w16_sse4_1() 45 const __m128i v_b01_w = _mm_cvtepu8_epi16(_mm_srli_si128(v_b0, 8)); in sse_w16_sse4_1() 240 xx_storel_64(&sse, _mm_add_epi64(sum, _mm_srli_si128(sum, 8))); in aom_highbd_sse_sse4_1() 258 xx_storel_64(&sse, _mm_add_epi64(sum, _mm_srli_si128(sum, 8))); in aom_highbd_sse_sse4_1() 280 xx_storel_64(&sse, _mm_add_epi64(sum, _mm_srli_si128(sum, 8))); in aom_highbd_sse_sse4_1() 310 xx_storel_64(&sse, _mm_add_epi64(sum, _mm_srli_si128(sum, 8))); in aom_highbd_sse_sse4_1() 346 xx_storel_64(&sse, _mm_add_epi64(sum, _mm_srli_si128(sum, 8))); in aom_highbd_sse_sse4_1()
|
/external/libhevc/common/x86/ |
D | ihevc_inter_pred_filters_ssse3_intr.c | 297 mask_high_96b = _mm_srli_si128(mask_low_32b, 12); in ihevc_inter_pred_luma_horz_ssse3() 333 … src_temp2_16x8b = _mm_srli_si128(src_temp1_16x8b, 1); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 338 … src_temp1_16x8b = _mm_srli_si128(src_temp1_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 339 … src_temp2_16x8b = _mm_srli_si128(src_temp2_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 344 … src_temp1_16x8b = _mm_srli_si128(src_temp1_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 345 … src_temp2_16x8b = _mm_srli_si128(src_temp2_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 350 … src_temp1_16x8b = _mm_srli_si128(src_temp1_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 351 … src_temp2_16x8b = _mm_srli_si128(src_temp2_16x8b, 2); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 366 … src_temp12_16x8b = _mm_srli_si128(src_temp11_16x8b, 1); /* row =1 */ in ihevc_inter_pred_luma_horz_ssse3() 371 … src_temp11_16x8b = _mm_srli_si128(src_temp11_16x8b, 2); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() [all …]
|
D | ihevc_chroma_intra_pred_filters_ssse3_intr.c | 354 src_temp3 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_ssse3() 355 src_temp4 = _mm_srli_si128(src_temp4, 8); in ihevc_intra_pred_chroma_dc_ssse3() 356 src_temp7 = _mm_srli_si128(src_temp7, 8); in ihevc_intra_pred_chroma_dc_ssse3() 357 src_temp8 = _mm_srli_si128(src_temp8, 8); in ihevc_intra_pred_chroma_dc_ssse3() 380 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_ssse3() 394 src_temp3 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_ssse3() 395 src_temp4 = _mm_srli_si128(src_temp4, 8); in ihevc_intra_pred_chroma_dc_ssse3() 411 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_ssse3() 422 src_temp4 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_ssse3() 435 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_ssse3() [all …]
|
D | ihevc_chroma_intra_pred_filters_sse42_intr.c | 333 src_temp3 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_sse42() 334 src_temp4 = _mm_srli_si128(src_temp4, 8); in ihevc_intra_pred_chroma_dc_sse42() 335 src_temp7 = _mm_srli_si128(src_temp7, 8); in ihevc_intra_pred_chroma_dc_sse42() 336 src_temp8 = _mm_srli_si128(src_temp8, 8); in ihevc_intra_pred_chroma_dc_sse42() 357 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_sse42() 371 src_temp3 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_sse42() 372 src_temp4 = _mm_srli_si128(src_temp4, 8); in ihevc_intra_pred_chroma_dc_sse42() 386 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_sse42() 397 src_temp4 = _mm_srli_si128(src_temp3, 8); in ihevc_intra_pred_chroma_dc_sse42() 407 temp_sad = _mm_srli_si128(src_temp4, 4); /* Next 32 bits */ in ihevc_intra_pred_chroma_dc_sse42()
|
D | ihevc_intra_pred_filters_ssse3_intr.c | 543 src_temp2 = _mm_srli_si128(src_temp1, 1); in ihevc_intra_pred_ref_filtering_ssse3() 544 src_temp3 = _mm_srli_si128(src_temp2, 1); in ihevc_intra_pred_ref_filtering_ssse3() 559 src_temp5 = _mm_srli_si128(src_temp4, 1); in ihevc_intra_pred_ref_filtering_ssse3() 560 src_temp6 = _mm_srli_si128(src_temp5, 1); in ihevc_intra_pred_ref_filtering_ssse3() 1466 src_temp2 = _mm_srli_si128(src_temp1, 1); in ihevc_intra_pred_luma_horz_ssse3() 1467 src_temp3 = _mm_srli_si128(src_temp1, 2); in ihevc_intra_pred_luma_horz_ssse3() 1468 src_temp4 = _mm_srli_si128(src_temp1, 3); in ihevc_intra_pred_luma_horz_ssse3() 1469 src_temp5 = _mm_srli_si128(src_temp1, 4); in ihevc_intra_pred_luma_horz_ssse3() 1470 src_temp6 = _mm_srli_si128(src_temp1, 5); in ihevc_intra_pred_luma_horz_ssse3() 1471 src_temp7 = _mm_srli_si128(src_temp1, 6); in ihevc_intra_pred_luma_horz_ssse3() [all …]
|
D | ihevc_deblk_ssse3_intr.c | 183 temp_coef0_8x16b = _mm_srli_si128(mask_d_result_4x32b, 4); in ihevc_deblk_luma_vert_ssse3() 184 temp_coef1_8x16b = _mm_srli_si128(mask_d_result_4x32b, 8); in ihevc_deblk_luma_vert_ssse3() 185 mask_16x8b = _mm_srli_si128(mask_d_result_4x32b, 12); in ihevc_deblk_luma_vert_ssse3() 195 temp_coef0_8x16b = _mm_srli_si128(mask_de_result_8x16b, 4); in ihevc_deblk_luma_vert_ssse3() 196 temp_coef1_8x16b = _mm_srli_si128(mask_de_result_8x16b, 8); in ihevc_deblk_luma_vert_ssse3() 197 mask_16x8b = _mm_srli_si128(mask_de_result_8x16b, 12); in ihevc_deblk_luma_vert_ssse3() 379 src_row2_8x16b = _mm_srli_si128(src_row0_8x16b, 8); in ihevc_deblk_luma_vert_ssse3() 380 src_row3_8x16b = _mm_srli_si128(src_row1_8x16b, 8); in ihevc_deblk_luma_vert_ssse3() 525 src_row1_8x16b = _mm_srli_si128(src_row0_8x16b, 8); in ihevc_deblk_luma_vert_ssse3() 526 src_row3_8x16b = _mm_srli_si128(src_row2_8x16b, 8); in ihevc_deblk_luma_vert_ssse3() [all …]
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | highbd_idct4x4_add_sse2.c | 41 temp1[1] = _mm_srli_si128(temp1[0], 4); // 1, 3 in highbd_idct4_small_sse2() 42 temp2[1] = _mm_srli_si128(temp2[0], 4); // 1, 3 in highbd_idct4_small_sse2() 50 temp1[3] = _mm_srli_si128(io[1], 4); in highbd_idct4_small_sse2() 51 temp2[3] = _mm_srli_si128(io[3], 4); in highbd_idct4_small_sse2() 109 max_input = _mm_max_epi16(max_input, _mm_srli_si128(max_input, 8)); in vpx_highbd_idct4x4_16_add_sse2() 110 min_input = _mm_min_epi16(min_input, _mm_srli_si128(min_input, 8)); in vpx_highbd_idct4x4_16_add_sse2() 111 max_input = _mm_max_epi16(max_input, _mm_srli_si128(max_input, 4)); in vpx_highbd_idct4x4_16_add_sse2() 112 min_input = _mm_min_epi16(min_input, _mm_srli_si128(min_input, 4)); in vpx_highbd_idct4x4_16_add_sse2() 113 max_input = _mm_max_epi16(max_input, _mm_srli_si128(max_input, 2)); in vpx_highbd_idct4x4_16_add_sse2() 114 min_input = _mm_min_epi16(min_input, _mm_srli_si128(min_input, 2)); in vpx_highbd_idct4x4_16_add_sse2()
|
D | highbd_intrapred_intrin_sse2.c | 217 const __m128i _dcba = _mm_add_epi16(ref_u16, _mm_srli_si128(ref_u16, 8)); in dc_sum_8() 406 const __m128i JIXABCD0 = _mm_srli_si128(KJIXABCD, 2); in vpx_highbd_d117_predictor_4x4_sse2() 407 const __m128i IXABCD00 = _mm_srli_si128(KJIXABCD, 4); in vpx_highbd_d117_predictor_4x4_sse2() 410 const __m128i row0 = _mm_srli_si128(avg2, 6); in vpx_highbd_d117_predictor_4x4_sse2() 411 const __m128i row1 = _mm_srli_si128(avg3, 4); in vpx_highbd_d117_predictor_4x4_sse2() 412 const __m128i row2 = _mm_srli_si128(avg2, 4); in vpx_highbd_d117_predictor_4x4_sse2() 413 const __m128i row3 = _mm_srli_si128(avg3, 2); in vpx_highbd_d117_predictor_4x4_sse2() 439 const __m128i JIXABCD0 = _mm_srli_si128(KJIXABCD, 2); in vpx_highbd_d135_predictor_4x4_sse2() 442 const __m128i row0 = _mm_srli_si128(avg3, 6); in vpx_highbd_d135_predictor_4x4_sse2() 443 const __m128i row1 = _mm_srli_si128(avg3, 4); in vpx_highbd_d135_predictor_4x4_sse2() [all …]
|
D | vpx_subpixel_4t_intrin_sse2.c | 56 src_reg_shift_1 = _mm_srli_si128(src_reg, 1); in vpx_filter_block1d16_h4_sse2() 57 src_reg_shift_2 = _mm_srli_si128(src_reg, 2); in vpx_filter_block1d16_h4_sse2() 58 src_reg_shift_3 = _mm_srli_si128(src_reg, 3); in vpx_filter_block1d16_h4_sse2() 73 src_reg_shift_1 = _mm_srli_si128(src_reg, 1); in vpx_filter_block1d16_h4_sse2() 74 src_reg_shift_2 = _mm_srli_si128(src_reg, 2); in vpx_filter_block1d16_h4_sse2() 75 src_reg_shift_3 = _mm_srli_si128(src_reg, 3); in vpx_filter_block1d16_h4_sse2() 292 src_reg_shift_1 = _mm_srli_si128(src_reg, 1); in vpx_filter_block1d8_h4_sse2() 293 src_reg_shift_2 = _mm_srli_si128(src_reg, 2); in vpx_filter_block1d8_h4_sse2() 294 src_reg_shift_3 = _mm_srli_si128(src_reg, 3); in vpx_filter_block1d8_h4_sse2() 469 src_reg_shift_1 = _mm_srli_si128(src_reg, 1); in vpx_filter_block1d4_h4_sse2() [all …]
|
/external/libhevc/decoder/x86/ |
D | ihevcd_it_rec_dc_sse42_intr.c | 115 m_temp_reg_1 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_luma_sse42() 116 m_temp_reg_2 = _mm_srli_si128(m_temp_reg_8, 8); in ihevcd_itrans_recon_dc_luma_sse42() 117 m_temp_reg_3 = _mm_srli_si128(m_temp_reg_8, 12); in ihevcd_itrans_recon_dc_luma_sse42() 163 m_temp_reg_13 = _mm_srli_si128(m_temp_reg_12, 8); in ihevcd_itrans_recon_dc_luma_sse42() 173 m_temp_reg_15 = _mm_srli_si128(m_temp_reg_14, 8); in ihevcd_itrans_recon_dc_luma_sse42() 277 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_sse42() 279 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_sse42() 281 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_sse42() 351 m_temp_reg_4 = _mm_srli_si128(m_temp_reg_4, 8); in ihevcd_itrans_recon_dc_chroma_sse42() 355 m_temp_reg_5 = _mm_srli_si128(m_temp_reg_5, 8); in ihevcd_itrans_recon_dc_chroma_sse42() [all …]
|
D | ihevcd_it_rec_dc_ssse3_intr.c | 116 m_temp_reg_1 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_luma_ssse3() 117 m_temp_reg_2 = _mm_srli_si128(m_temp_reg_8, 8); in ihevcd_itrans_recon_dc_luma_ssse3() 118 m_temp_reg_3 = _mm_srli_si128(m_temp_reg_8, 12); in ihevcd_itrans_recon_dc_luma_ssse3() 164 m_temp_reg_13 = _mm_srli_si128(m_temp_reg_12, 8); in ihevcd_itrans_recon_dc_luma_ssse3() 174 m_temp_reg_15 = _mm_srli_si128(m_temp_reg_14, 8); in ihevcd_itrans_recon_dc_luma_ssse3() 277 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_ssse3() 279 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_ssse3() 281 m_temp_reg_8 = _mm_srli_si128(m_temp_reg_8, 4); in ihevcd_itrans_recon_dc_chroma_ssse3() 351 m_temp_reg_4 = _mm_srli_si128(m_temp_reg_4, 8); in ihevcd_itrans_recon_dc_chroma_ssse3() 355 m_temp_reg_5 = _mm_srli_si128(m_temp_reg_5, 8); in ihevcd_itrans_recon_dc_chroma_ssse3() [all …]
|
/external/libaom/libaom/av1/common/x86/ |
D | convolve_sse2.c | 269 s[0] = _mm_unpacklo_epi8(data, _mm_srli_si128(data, 1)); in av1_convolve_x_sr_sse2() 271 _mm_unpacklo_epi8(_mm_srli_si128(data, 2), _mm_srli_si128(data, 3)); in av1_convolve_x_sr_sse2() 273 _mm_unpacklo_epi8(_mm_srli_si128(data, 4), _mm_srli_si128(data, 5)); in av1_convolve_x_sr_sse2() 275 _mm_unpacklo_epi8(_mm_srli_si128(data, 6), _mm_srli_si128(data, 7)); in av1_convolve_x_sr_sse2() 306 s[1] = _mm_srli_si128(data, 2); in av1_convolve_x_sr_sse2() 307 s[2] = _mm_srli_si128(data, 4); in av1_convolve_x_sr_sse2() 308 s[3] = _mm_srli_si128(data, 6); in av1_convolve_x_sr_sse2() 312 s[0] = _mm_srli_si128(data, 1); in av1_convolve_x_sr_sse2() 313 s[1] = _mm_srli_si128(data, 3); in av1_convolve_x_sr_sse2() 314 s[2] = _mm_srli_si128(data, 5); in av1_convolve_x_sr_sse2() [all …]
|
D | jnt_convolve_sse2.c | 60 s[0] = _mm_unpacklo_epi8(data, _mm_srli_si128(data, 1)); in av1_dist_wtd_convolve_x_sse2() 62 _mm_unpacklo_epi8(_mm_srli_si128(data, 2), _mm_srli_si128(data, 3)); in av1_dist_wtd_convolve_x_sse2() 64 _mm_unpacklo_epi8(_mm_srli_si128(data, 4), _mm_srli_si128(data, 5)); in av1_dist_wtd_convolve_x_sse2() 66 _mm_unpacklo_epi8(_mm_srli_si128(data, 6), _mm_srli_si128(data, 7)); in av1_dist_wtd_convolve_x_sse2() 106 s[1] = _mm_srli_si128(data, 2); in av1_dist_wtd_convolve_x_sse2() 107 s[2] = _mm_srli_si128(data, 4); in av1_dist_wtd_convolve_x_sse2() 108 s[3] = _mm_srli_si128(data, 6); in av1_dist_wtd_convolve_x_sse2() 112 s[0] = _mm_srli_si128(data, 1); in av1_dist_wtd_convolve_x_sse2() 113 s[1] = _mm_srli_si128(data, 3); in av1_dist_wtd_convolve_x_sse2() 114 s[2] = _mm_srli_si128(data, 5); in av1_dist_wtd_convolve_x_sse2() [all …]
|
D | wiener_convolve_sse2.c | 75 const __m128i src_2 = _mm_unpacklo_epi8(_mm_srli_si128(data, 2), zero); in av1_wiener_convolve_add_src_sse2() 77 const __m128i src_4 = _mm_unpacklo_epi8(_mm_srli_si128(data, 4), zero); in av1_wiener_convolve_add_src_sse2() 79 const __m128i src_6 = _mm_unpacklo_epi8(_mm_srli_si128(data, 6), zero); in av1_wiener_convolve_add_src_sse2() 88 const __m128i src_1 = _mm_unpacklo_epi8(_mm_srli_si128(data, 1), zero); in av1_wiener_convolve_add_src_sse2() 90 const __m128i src_3 = _mm_unpacklo_epi8(_mm_srli_si128(data, 3), zero); in av1_wiener_convolve_add_src_sse2() 92 const __m128i src_5 = _mm_unpacklo_epi8(_mm_srli_si128(data, 5), zero); in av1_wiener_convolve_add_src_sse2() 94 const __m128i src_7 = _mm_unpacklo_epi8(_mm_srli_si128(data, 7), zero); in av1_wiener_convolve_add_src_sse2()
|
/external/libaom/libaom/aom_dsp/simd/ |
D | v64_intrinsics_x86.h | 30 return (uint32_t)_mm_cvtsi128_si32(_mm_srli_si128(a, 4)); in v64_high_u32() 36 return (int32_t)_mm_cvtsi128_si32(_mm_srli_si128(a, 4)); in v64_high_s32() 95 ((c) ? _mm_srli_si128(_mm_unpacklo_epi64(b, a), (c)) : b) 156 return _mm_srli_si128(_mm_unpacklo_epi8(b, a), 8); in v64_ziphi_8() 162 return _mm_srli_si128(_mm_unpacklo_epi16(b, a), 8); in v64_ziphi_16() 168 return _mm_srli_si128(_mm_unpacklo_epi32(b, a), 8); in v64_ziphi_32() 247 return _mm_srli_si128(_mm_unpacklo_epi8(a, _mm_setzero_si128()), 8); in v64_unpackhi_u8_s16() 255 return _mm_srli_si128(_mm_srai_epi16(_mm_unpacklo_epi8(a, a), 8), 8); in v64_unpackhi_s8_s16() 267 return _mm_srli_si128(_mm_unpacklo_epi16(a, _mm_setzero_si128()), 8); in v64_unpackhi_u16_s32() 271 return _mm_srli_si128( in v64_unpackhi_s16_s32() [all …]
|
D | v128_intrinsics_x86.h | 28 SIMD_INLINE v64 v128_high_v64(v128 a) { return _mm_srli_si128(a, 8); } in v128_high_v64() 71 ((c) ? _mm_or_si128(_mm_srli_si128(b, c), _mm_slli_si128(a, 16 - (c))) : (b)) 78 ((c) ? _mm_or_si128(_mm_srli_si128(b, c), _mm_slli_si128(a, 16 - (c))) : (b)) 321 t = v128_add_32(t, _mm_srli_si128(t, 8)); in v128_dotp_su8() 322 t = v128_add_32(t, _mm_srli_si128(t, 4)); in v128_dotp_su8() 330 _mm_cvtepi32_epi64(_mm_srli_si128(r, 8))); in v128_dotp_s16() 331 return _mm_cvtsi128_si64(_mm_add_epi64(c, _mm_srli_si128(c, 8))); in v128_dotp_s16() 334 (int64_t)_mm_cvtsi128_si32(_mm_srli_si128(r, 4)) + in v128_dotp_s16() 335 (int64_t)_mm_cvtsi128_si32(_mm_srli_si128(r, 8)) + in v128_dotp_s16() 336 (int64_t)_mm_cvtsi128_si32(_mm_srli_si128(r, 12)); in v128_dotp_s16() [all …]
|
/external/libavc/encoder/x86/ |
D | ih264e_half_pel_ssse3.c | 135 …src_r0_sht_16x8b = _mm_srli_si128(src_r0_16x8b, 1); //a1 a2 a3 a4 a5 a6 a7 a8… in ih264e_sixtapfilter_horz_ssse3() 136 …src_r1_sht_16x8b = _mm_srli_si128(src_r1_16x8b, 1); //b1 b2 b3 b4 b5 b6 b7 b8… in ih264e_sixtapfilter_horz_ssse3() 146 …src_r0_16x8b = _mm_srli_si128(src_r0_16x8b, 2); //a2 a3 a4 a5 a6 a7 a8 a9… in ih264e_sixtapfilter_horz_ssse3() 147 …src_r1_16x8b = _mm_srli_si128(src_r1_16x8b, 2); //b2 b3 b4 b5 b6 b7 b8 b9… in ih264e_sixtapfilter_horz_ssse3() 149 …src_r0_sht_16x8b = _mm_srli_si128(src_r0_sht_16x8b, 2); //a3 a4 a5 a6 a7 a8 a9...… in ih264e_sixtapfilter_horz_ssse3() 150 …src_r1_sht_16x8b = _mm_srli_si128(src_r1_sht_16x8b, 2); //b3 b4 b5 b6 b7 b8 b9...… in ih264e_sixtapfilter_horz_ssse3() 160 …src_r0_16x8b = _mm_srli_si128(src_r0_16x8b, 2); //a4 a5 a6 a7 a8 a9....a1… in ih264e_sixtapfilter_horz_ssse3() 161 …src_r1_16x8b = _mm_srli_si128(src_r1_16x8b, 2); //b4 b5 b6 b7 b8 b9....b1… in ih264e_sixtapfilter_horz_ssse3() 163 …src_r0_sht_16x8b = _mm_srli_si128(src_r0_sht_16x8b, 2); //a5 a6 a7 a8 a9....a15 0… in ih264e_sixtapfilter_horz_ssse3() 164 …src_r1_sht_16x8b = _mm_srli_si128(src_r1_sht_16x8b, 2); //b5 b6 b7 b8 b9....b15 0… in ih264e_sixtapfilter_horz_ssse3()
|
/external/clang/test/CodeGen/ |
D | sse.c | 31 return _mm_srli_si128(a, 5); in test_mm_srli_si128() 37 return _mm_srli_si128(a, 0); in test_mm_srli_si128_0() 43 return _mm_srli_si128(a, 16); in test_mm_srli_si128_16()
|