Home
last modified time | relevance | path

Searched refs:_mm_hadd_epi32 (Results 1 – 24 of 24) sorted by relevance

/external/libgav1/libgav1/src/dsp/x86/
Dsuper_res_sse4.cc82 const __m128i res0 = _mm_hadd_epi32(weighted_src[0], weighted_src[1]); in ComputeSuperRes4()
83 const __m128i res1 = _mm_hadd_epi32(weighted_src[2], weighted_src[3]); in ComputeSuperRes4()
84 const __m128i result0 = _mm_hadd_epi32(res0, res1); in ComputeSuperRes4()
103 const __m128i res0 = _mm_hadd_epi32(weighted_src[0], weighted_src[1]); in ComputeSuperRes8()
104 const __m128i res1 = _mm_hadd_epi32(weighted_src[2], weighted_src[3]); in ComputeSuperRes8()
105 const __m128i res2 = _mm_hadd_epi32(weighted_src[4], weighted_src[5]); in ComputeSuperRes8()
106 const __m128i res3 = _mm_hadd_epi32(weighted_src[6], weighted_src[7]); in ComputeSuperRes8()
107 const __m128i result0 = _mm_hadd_epi32(res0, res1); in ComputeSuperRes8()
108 const __m128i result1 = _mm_hadd_epi32(res2, res3); in ComputeSuperRes8()
Dcdef_sse4.cc338 a = _mm_hadd_epi32(a, a); in SumVector_S32()
/external/libaom/libaom/av1/common/x86/
Dav1_convolve_horiz_rs_sse4.c105 const __m128i conv01_32 = _mm_hadd_epi32(conv0_32, conv1_32); in av1_convolve_horiz_rs_sse4_1()
106 const __m128i conv23_32 = _mm_hadd_epi32(conv2_32, conv3_32); in av1_convolve_horiz_rs_sse4_1()
108 const __m128i conv0123_32 = _mm_hadd_epi32(conv01_32, conv23_32); in av1_convolve_horiz_rs_sse4_1()
208 const __m128i conv01_32 = _mm_hadd_epi32(conv0_32, conv1_32); in av1_highbd_convolve_horiz_rs_sse4_1()
209 const __m128i conv23_32 = _mm_hadd_epi32(conv2_32, conv3_32); in av1_highbd_convolve_horiz_rs_sse4_1()
211 const __m128i conv0123_32 = _mm_hadd_epi32(conv01_32, conv23_32); in av1_highbd_convolve_horiz_rs_sse4_1()
Dav1_convolve_scale_sse4.c75 const __m128i conv01lo = _mm_hadd_epi32(conv0lo, conv1lo); in hfilter8()
76 const __m128i conv23lo = _mm_hadd_epi32(conv2lo, conv3lo); in hfilter8()
77 const __m128i conv = _mm_hadd_epi32(conv01lo, conv23lo); in hfilter8()
161 const __m128i conv01 = _mm_hadd_epi32(conv0, conv1); in vfilter8()
162 const __m128i conv23 = _mm_hadd_epi32(conv2, conv3); in vfilter8()
163 __m128i conv = _mm_hadd_epi32(conv01, conv23); in vfilter8()
305 const __m128i conv01lo = _mm_hadd_epi32(conv0lo, conv1lo); in highbd_hfilter8()
306 const __m128i conv23lo = _mm_hadd_epi32(conv2lo, conv3lo); in highbd_hfilter8()
307 const __m128i conv = _mm_hadd_epi32(conv01lo, conv23lo); in highbd_hfilter8()
392 const __m128i conv01 = _mm_hadd_epi32(conv0, conv1); in highbd_vfilter8()
[all …]
/external/libaom/libaom/aom_dsp/x86/
Dhighbd_variance_sse4.c54 s2 = _mm_hadd_epi32(t0, t1); in variance4x4_64_sse4_1()
55 s3 = _mm_hadd_epi32(s2, s2); in variance4x4_64_sse4_1()
56 y0 = _mm_hadd_epi32(s3, s3); in variance4x4_64_sse4_1()
61 s2 = _mm_hadd_epi32(t0, t1); in variance4x4_64_sse4_1()
62 s3 = _mm_hadd_epi32(s2, s2); in variance4x4_64_sse4_1()
63 x0 = _mm_hadd_epi32(s3, s3); in variance4x4_64_sse4_1()
Dobmc_intrinsic_ssse3.h20 v_d = _mm_hadd_epi32(v_d, v_d); in xx_hsum_epi32_si32()
21 v_d = _mm_hadd_epi32(v_d, v_d); in xx_hsum_epi32_si32()
Dmasked_sad_intrin_ssse3.c338 res = _mm_hadd_epi32(res, res); in highbd_masked_sad_ssse3()
339 res = _mm_hadd_epi32(res, res); in highbd_masked_sad_ssse3()
398 res = _mm_hadd_epi32(res, res); in aom_highbd_masked_sad4xh_ssse3()
399 res = _mm_hadd_epi32(res, res); in aom_highbd_masked_sad4xh_ssse3()
Dobmc_variance_avx2.c77 v_d = _mm_hadd_epi32(v_sum_d, v_sse_d); in obmc_variance_w8n()
78 v_d = _mm_hadd_epi32(v_d, v_d); in obmc_variance_w8n()
Dmasked_variance_intrin_ssse3.c452 sum = _mm_hadd_epi32(sum, sum_sq); in masked_variance()
453 sum = _mm_hadd_epi32(sum, sum); in masked_variance()
482 sum = _mm_hadd_epi32(sum, sum_sq); in masked_variance8xh()
483 sum = _mm_hadd_epi32(sum, sum); in masked_variance8xh()
514 sum = _mm_hadd_epi32(sum, sum_sq); in masked_variance4xh()
515 sum = _mm_hadd_epi32(sum, sum); in masked_variance4xh()
958 sum = _mm_hadd_epi32(sum, zero); in highbd_masked_variance()
959 sum = _mm_hadd_epi32(sum, zero); in highbd_masked_variance()
1024 sum = _mm_hadd_epi32(sum, sum_sq); in highbd_masked_variance4xh()
1025 sum = _mm_hadd_epi32(sum, zero); in highbd_masked_variance4xh()
/external/flac/libFLAC/
Dstream_encoder_intrin_ssse3.c89 mm_sum = _mm_hadd_epi32(mm_sum, mm_sum); in FLAC__precompute_partition_info_sums_intrin_ssse3()
90 mm_sum = _mm_hadd_epi32(mm_sum, mm_sum); in FLAC__precompute_partition_info_sums_intrin_ssse3()
Dstream_encoder_intrin_avx2.c86 sum128 = _mm_hadd_epi32(sum128, sum128); in FLAC__precompute_partition_info_sums_intrin_avx2()
87 sum128 = _mm_hadd_epi32(sum128, sum128); in FLAC__precompute_partition_info_sums_intrin_avx2()
/external/libaom/libaom/av1/encoder/x86/
Drdopt_sse4.c50 const __m128i xy32 = _mm_hadd_epi32(xy_madd_b, xy_madd_a); in horver_correlation_4x4()
62 const __m128i xz32 = _mm_hadd_epi32(xz_madd_b, xz_madd_a); in horver_correlation_4x4()
82 const __m128i sum2 = _mm_hadd_epi32(slli_a_2, swap_b_2); in horver_correlation_4x4()
Dtemporal_filter_sse4.c1500 y_reg_fst = _mm_hadd_epi32(y_fst, y_snd); in highbd_add_luma_dist_to_8_chroma_mod()
1512 y_reg_snd = _mm_hadd_epi32(y_fst, y_snd); in highbd_add_luma_dist_to_8_chroma_mod()
/external/tensorflow/tensorflow/lite/kernels/internal/optimized/
Dsse_tensor_utils.cc48 acc = _mm_hadd_epi32(acc, acc); in ReduceInt32x4()
52 acc = _mm_hadd_epi32(acc, acc); in ReduceInt32x4()
/external/XNNPACK/src/q8-gemm/
D2x4c8-sse2.c20 const __m128i xxyy = _mm_hadd_epi32(x, y); in sse_reduce4_i32()
22 const __m128i zzww = _mm_hadd_epi32(z, w); in sse_reduce4_i32()
24 return _mm_hadd_epi32(xxyy, zzww); in sse_reduce4_i32()
/external/libavc/common/x86/
Dih264_ihadamard_scaling_sse42.c221 temp0 = _mm_hadd_epi32(plane_0, plane_1); //a0+a1 a2+a3 b0+b1 b2+b3 in ih264_ihadamard_scaling_2x2_uv_sse42()
223 …plane_0 = _mm_hadd_epi32(temp0, temp1); //a0+a1+a2+a3 b0+b1+b2+b3 a0-a1+a2-a3 b0-b1+b2… in ih264_ihadamard_scaling_2x2_uv_sse42()
Dih264_chroma_intra_pred_filters_ssse3.c292 hv_val_4x32b = _mm_hadd_epi32(h_val_4x32b, v_val_4x32b); in ih264_intra_pred_chroma_8x8_mode_plane_ssse3()
Dih264_resi_trans_quant_sse42.c918 temp0 = _mm_hadd_epi32(plane_0, plane_1); //a0+a1 a2+a3 b0+b1 b2+b3 in ih264_hadamard_quant_2x2_uv_sse42()
921 …plane_0 = _mm_hadd_epi32(temp0, temp1); //a0+a1+a2+a3 b0+b1+b2+b3 a0-a1+a2-a3 b0-b1+b2… in ih264_hadamard_quant_2x2_uv_sse42()
Dih264_luma_intra_pred_filters_ssse3.c2055 hv_val_4x32b = _mm_hadd_epi32(h_val_4x32b, v_val_4x32b); in ih264_intra_pred_luma_16x16_mode_plane_ssse3()
2056 hv_val_4x32b = _mm_hadd_epi32(hv_val_4x32b, hv_val_4x32b); in ih264_intra_pred_luma_16x16_mode_plane_ssse3()
/external/clang/test/CodeGen/
Dssse3-builtins.c49 return _mm_hadd_epi32(a, b); in test_mm_hadd_epi32()
/external/eigen/Eigen/src/Core/arch/SSE/
DPacketMath.h561 return _mm_hadd_epi32(_mm_hadd_epi32(vecs[0], vecs[1]),_mm_hadd_epi32(vecs[2], vecs[3]));
565 Packet4i tmp0 = _mm_hadd_epi32(a,a);
566 return pfirst<Packet4i>(_mm_hadd_epi32(tmp0,tmp0));
/external/clang/lib/Headers/
Dtmmintrin.h227 _mm_hadd_epi32(__m128i __a, __m128i __b) in _mm_hadd_epi32() function
/external/libvpx/libvpx/vp9/encoder/x86/
Dhighbd_temporal_filter_sse4.c468 y_reg_fst = _mm_hadd_epi32(y_fst, y_snd); in highbd_add_luma_dist_to_8_chroma_mod()
480 y_reg_snd = _mm_hadd_epi32(y_fst, y_snd); in highbd_add_luma_dist_to_8_chroma_mod()
/external/neon_2_sse/
DNEON_2_SSE.h6289 hadd128 = _mm_hadd_epi32 (_pM128i(a), _pM128i(b)); in vpadd_s32()
6376 r32_1 = _mm_hadd_epi32(r32_1, r32_1); //use low 64 bits in vpaddl_s16()
6439 return _mm_hadd_epi32 (r32_1, r32_2); in vpaddlq_s16()