/external/libaom/libaom/aom_dsp/x86/ |
D | loopfilter_sse2.c | 141 static AOM_FORCE_INLINE void filter4_sse2(__m128i *p1p0, __m128i *q1q0, in filter4_sse2() argument 153 qs1qs0_work = _mm_xor_si128(*q1q0, t80); in filter4_sse2() 192 static AOM_FORCE_INLINE void filter4_dual_sse2(__m128i *p1p0, __m128i *q1q0, in filter4_dual_sse2() argument 205 qs1qs0_work = _mm_xor_si128(*q1q0, t80); in filter4_dual_sse2() 247 __m128i q1p1, q0p0, p1p0, q1q0; in lpf_internal_4_sse2() local 256 q1q0 = _mm_srli_si128(p1p0, 8); in lpf_internal_4_sse2() 261 __m128i abs_p1q1p0q0 = abs_diff(p1p0, q1q0); in lpf_internal_4_sse2() 284 filter4_sse2(&p1p0, &q1q0, &hev, &mask, q1q0_out, p1p0_out); in lpf_internal_4_sse2() 290 __m128i q1p1, q0p0, p1p0, q1q0; in lpf_internal_4_dual_sse2() local 299 q1q0 = _mm_unpackhi_epi64(q0p0, q1p1); in lpf_internal_4_dual_sse2() [all …]
|
D | highbd_loopfilter_sse2.c | 109 __m128i *p1p0, __m128i *q1q0, in highbd_hev_filter_mask_x_sse2() argument 120 *q1q0 = _mm_unpackhi_epi64(pq[0], pq[1]); in highbd_hev_filter_mask_x_sse2() 122 abs_p0q0_p1q1 = abs_diff16(*p1p0, *q1q0); in highbd_hev_filter_mask_x_sse2() 213 static AOM_FORCE_INLINE void highbd_filter4_sse2(__m128i *p1p0, __m128i *q1q0, in highbd_filter4_sse2() argument 229 qs1qs0_work = _mm_subs_epi16(*q1q0, *t80); in highbd_filter4_sse2() 339 __m128i p1p0, q1q0, abs_p1p0; in highbd_lpf_internal_14_sse2() local 341 highbd_hev_filter_mask_x_sse2(pq, 4, &p1p0, &q1q0, &abs_p1p0, &limit, &blimit, in highbd_lpf_internal_14_sse2() 346 highbd_filter4_sse2(&p1p0, &q1q0, &hevhev, &mask, &qs0qs1, &ps0ps1, &t80, bd); in highbd_lpf_internal_14_sse2() 743 __m128i p1p0, q1q0, abs_p1p0, ps1ps0, qs1qs0; in highbd_lpf_internal_6_sse2() local 757 highbd_hev_filter_mask_x_sse2(pq, 3, &p1p0, &q1q0, &abs_p1p0, &limit, &blimit, in highbd_lpf_internal_6_sse2() [all …]
|
/external/libgav1/libgav1/src/dsp/x86/ |
D | loop_filter_sse4.cc | 52 inline __m128i CheckOuterThreshF4(const __m128i& q1q0, const __m128i& p1p0, in CheckOuterThreshF4() argument 56 const __m128i abs_pmq = AbsDiff(p1p0, q1q0); in CheckOuterThreshF4() 91 inline __m128i NeedsFilter4(const __m128i& q1q0, const __m128i& p1p0, in NeedsFilter4() argument 95 const __m128i outer_mask = CheckOuterThreshF4(q1q0, p1p0, outer_thresh); in NeedsFilter4() 159 const __m128i q1q0 = _mm_unpacklo_epi32(q0, q1); in Horizontal4() local 164 NeedsFilter4(q1q0, p1p0, qp1, qp0, v_outer_thresh, v_inner_thresh); in Horizontal4() 230 const __m128i q1q0 = _mm_srli_si128(d0, 8); in Vertical4() local 235 NeedsFilter4(q1q0, p1p0, qp1, qp0, v_outer_thresh, v_inner_thresh); in Vertical4() 257 inline __m128i NeedsFilter6(const __m128i& q1q0, const __m128i& p1p0, in NeedsFilter6() argument 261 const __m128i outer_mask = CheckOuterThreshF4(q1q0, p1p0, outer_thresh); in NeedsFilter6() [all …]
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | loopfilter_sse2.c | 28 const __m128i abs_p1q1p0q0 = abs_diff(p1p0, q1q0); \ 68 qs1qs0 = _mm_xor_si128(q1q0, t80); \ 116 __m128i q1p1, q0p0, p3p2, p2p1, p1p0, q3q2, q2q1, q1q0, ps1ps0, qs1qs0; in vpx_lpf_horizontal_4_sse2() local 129 q1q0 = _mm_unpackhi_epi64(q0p0, q1p1); in vpx_lpf_horizontal_4_sse2() 151 __m128i q1p1, q0p0, p3p2, p2p1, p1p0, q3q2, q2q1, q1q0, ps1ps0, qs1qs0; in vpx_lpf_vertical_4_sse2() local 155 q1q0 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(s + 0 * pitch - 4)), in vpx_lpf_vertical_4_sse2() 172 p1p0 = _mm_unpacklo_epi16(q1q0, x1); in vpx_lpf_vertical_4_sse2() 183 q1q0 = _mm_unpackhi_epi16(q1q0, x1); in vpx_lpf_vertical_4_sse2() 187 q3q2 = _mm_unpackhi_epi32(q1q0, x2); in vpx_lpf_vertical_4_sse2() 189 q1q0 = _mm_unpacklo_epi32(q1q0, x2); in vpx_lpf_vertical_4_sse2() [all …]
|