Home
last modified time | relevance | path

Searched refs:res_lo (Results 1 – 25 of 28) sorted by relevance

12

/external/libaom/libaom/av1/common/x86/
Dhighbd_warp_plane_sse4.c533 __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_warp_affine_sse4_1() local
540 res_lo = _mm_add_epi32(res_lo, res_add_const); in av1_highbd_warp_affine_sse4_1()
541 res_lo = _mm_sra_epi32(_mm_add_epi32(res_lo, reduce_bits_vert_const), in av1_highbd_warp_affine_sse4_1()
549 res_lo = _mm_add_epi32(_mm_mullo_epi32(p_32, wt0), in av1_highbd_warp_affine_sse4_1()
550 _mm_mullo_epi32(res_lo, wt1)); in av1_highbd_warp_affine_sse4_1()
551 res_lo = _mm_srai_epi32(res_lo, DIST_PRECISION_BITS); in av1_highbd_warp_affine_sse4_1()
553 res_lo = _mm_srai_epi32(_mm_add_epi32(p_32, res_lo), 1); in av1_highbd_warp_affine_sse4_1()
556 __m128i res32_lo = _mm_add_epi32(res_lo, res_sub_const); in av1_highbd_warp_affine_sse4_1()
564 res_lo = _mm_packus_epi32(res_lo, res_lo); in av1_highbd_warp_affine_sse4_1()
565 _mm_storel_epi64(p, res_lo); in av1_highbd_warp_affine_sse4_1()
[all …]
Dconvolve_sse2.c167 __m128i s[8], src6, res_lo, res_hi; in av1_convolve_y_sr_sse2() local
199 res_lo = convolve_lo_y(s, coeffs); // Filter low index pixels in av1_convolve_y_sr_sse2()
203 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_convolve_y_sr_sse2()
213 res_lo = convolve_lo_y(s + 1, coeffs); // Filter low index pixels in av1_convolve_y_sr_sse2()
217 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_convolve_y_sr_sse2()
276 const __m128i res_lo = convolve_lo_x(s, coeffs); in av1_convolve_x_sr_sse2() local
278 _mm_sra_epi32(_mm_add_epi32(res_lo, round_0_const), round_0_shift); in av1_convolve_x_sr_sse2()
319 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_convolve_x_sr_sse2() local
322 _mm_sra_epi32(_mm_add_epi32(res_lo, round_0_const), round_0_shift); in av1_convolve_x_sr_sse2()
Dwarp_plane_sse4.c544 __m128i *res_lo, __m128i *res_hi, in filter_src_pixels_vertical() argument
577 *res_lo = _mm_unpacklo_epi32(res_even, res_odd); in filter_src_pixels_vertical()
582 __m128i *res_lo, __m128i *res_hi, const __m128i *res_add_const, in store_vertical_filter_output() argument
587 __m128i res_lo_1 = *res_lo; in store_vertical_filter_output()
693 __m128i res_lo; in warp_vertical_filter() local
695 filter_src_pixels_vertical(tmp, coeffs, &res_lo, &res_hi, k); in warp_vertical_filter()
697 store_vertical_filter_output(&res_lo, &res_hi, res_add_const, &wt, in warp_vertical_filter()
721 __m128i res_lo; in warp_vertical_filter_gamma0() local
723 filter_src_pixels_vertical(tmp, coeffs, &res_lo, &res_hi, k); in warp_vertical_filter_gamma0()
725 store_vertical_filter_output(&res_lo, &res_hi, res_add_const, &wt, in warp_vertical_filter_gamma0()
[all …]
Djnt_convolve_sse2.c67 const __m128i res_lo = convolve_lo_x(s, coeffs); in av1_dist_wtd_convolve_x_sse2() local
69 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_dist_wtd_convolve_x_sse2()
119 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_x_sse2() local
122 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_dist_wtd_convolve_x_sse2()
285 __m128i s[8], src6, res_lo, res_hi, res_lo_shift, res_hi_shift; in av1_dist_wtd_convolve_y_sse2() local
316 res_lo = convolve_lo_y(s, coeffs); // Filter low index pixels in av1_dist_wtd_convolve_y_sse2()
318 res_lo_shift = _mm_sll_epi32(res_lo, left_shift); in av1_dist_wtd_convolve_y_sse2()
346 res_lo = convolve_lo_y(s + 1, coeffs); // Filter low index pixels in av1_dist_wtd_convolve_y_sse2()
348 res_lo_shift = _mm_sll_epi32(res_lo, left_shift); in av1_dist_wtd_convolve_y_sse2()
580 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_sse2() local
[all …]
Djnt_convolve_avx2.c272 __m256i res_lo = convolve_lowbd_4tap(s, coeffs + 1); in av1_dist_wtd_convolve_y_avx2() local
274 res_lo = _mm256_add_epi16(res_lo, offset_const_1); in av1_dist_wtd_convolve_y_avx2()
276 const __m256i res_lo_0_32b = _mm256_unpacklo_epi16(res_lo, zero); in av1_dist_wtd_convolve_y_avx2()
282 const __m256i res_lo_1_32b = _mm256_unpackhi_epi16(res_lo, zero); in av1_dist_wtd_convolve_y_avx2()
451 __m256i res_lo = convolve_lowbd(s, coeffs); in av1_dist_wtd_convolve_y_avx2() local
453 res_lo = _mm256_add_epi16(res_lo, offset_const_1); in av1_dist_wtd_convolve_y_avx2()
455 const __m256i res_lo_0_32b = _mm256_unpacklo_epi16(res_lo, zero); in av1_dist_wtd_convolve_y_avx2()
461 const __m256i res_lo_1_32b = _mm256_unpackhi_epi16(res_lo, zero); in av1_dist_wtd_convolve_y_avx2()
Dwarp_plane_avx2.c627 __m256i *res_lo, in filter_src_pixels_vertical_avx2() argument
654 *res_lo = _mm256_unpacklo_epi32(res_even, res_odd); in filter_src_pixels_vertical_avx2()
659 const __m256i *res_lo, const __m256i *res_hi, const __m256i *res_add_const, in store_vertical_filter_output_avx2() argument
664 __m256i res_lo_1 = *res_lo; in store_vertical_filter_output_avx2()
810 __m256i res_lo, res_hi; in warp_vertical_filter_avx2() local
811 filter_src_pixels_vertical_avx2(horz_out, src, coeffs, &res_lo, &res_hi, in warp_vertical_filter_avx2()
813 store_vertical_filter_output_avx2(&res_lo, &res_hi, res_add_const, wt, in warp_vertical_filter_avx2()
860 __m256i res_lo, res_hi; in warp_vertical_filter_gamma0_avx2() local
861 filter_src_pixels_vertical_avx2(horz_out, src, coeffs, &res_lo, &res_hi, in warp_vertical_filter_gamma0_avx2()
863 store_vertical_filter_output_avx2(&res_lo, &res_hi, res_add_const, wt, in warp_vertical_filter_gamma0_avx2()
[all …]
Dconvolve_avx2.c94 const __m256i res_lo = convolve_lowbd_4tap(s, coeffs + 1); in av1_convolve_y_sr_avx2() local
98 _mm256_add_epi16(res_lo, right_shift_const), right_shift); in av1_convolve_y_sr_avx2()
206 const __m256i res_lo = convolve_lowbd(s, coeffs); in av1_convolve_y_sr_avx2() local
211 _mm256_add_epi16(res_lo, right_shift_const), right_shift); in av1_convolve_y_sr_avx2()
Dconvolve_2d_sse2.c188 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_convolve_2d_sr_sse2() local
192 _mm_sra_epi32(_mm_add_epi32(res_lo, sum_round), sum_shift); in av1_convolve_2d_sr_sse2()
402 const __m128i res_lo = _mm_sll_epi16(d16_lo, left_shift); in av1_dist_wtd_convolve_2d_copy_sse2() local
403 const __m128i res_unsigned_lo = _mm_add_epi16(res_lo, offset_const); in av1_dist_wtd_convolve_2d_copy_sse2()
Dwiener_convolve_sse2.c183 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_wiener_convolve_add_src_sse2() local
187 _mm_add_epi32(res_lo, round_const), conv_params->round_1); in av1_wiener_convolve_add_src_sse2()
Dhighbd_wiener_convolve_ssse3.c185 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_ssse3() local
189 _mm_add_epi32(res_lo, round_const), conv_params->round_1); in av1_highbd_wiener_convolve_add_src_ssse3()
Dhighbd_wiener_convolve_avx2.c225 const __m256i res_lo = _mm256_unpacklo_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_avx2() local
229 _mm256_add_epi32(res_lo, round_const), conv_params->round_1); in av1_highbd_wiener_convolve_add_src_avx2()
Djnt_convolve_ssse3.c196 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_ssse3() local
200 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_dist_wtd_convolve_2d_ssse3()
Dhighbd_convolve_2d_sse4.c348 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_2d_sse4_1() local
352 _mm_sra_epi32(_mm_add_epi32(res_lo, round_const), round_shift); in av1_highbd_dist_wtd_convolve_2d_sse4_1()
/external/libaom/libaom/av1/common/arm/
Dwarp_plane_neon.c488 int32x4_t res_lo, res_hi; in av1_warp_affine_neon() local
627 vertical_filter_neon(v_src, &res_lo, &res_hi, sy, gamma); in av1_warp_affine_neon()
629 res_lo = vaddq_s32(res_lo, add_const_vert); in av1_warp_affine_neon()
637 res_lo = vrshlq_s32(res_lo, shift_vert); in av1_warp_affine_neon()
644 res_lo = vmulq_s32(res_lo, bwd); in av1_warp_affine_neon()
646 tmp32_lo = vaddq_s32(tmp32_lo, res_lo); in av1_warp_affine_neon()
649 tmp32_lo = vaddq_s32(tmp32_lo, res_lo); in av1_warp_affine_neon()
659 uint16x4_t res_u16_low = vqmovun_s32(res_lo); in av1_warp_affine_neon()
696 res_lo = vrshlq_s32(res_lo, shift_vert); in av1_warp_affine_neon()
699 result_final = vcombine_s16(vmovn_s32(res_lo), vmovn_s32(res_hi)); in av1_warp_affine_neon()
/external/libaom/libaom/aom_dsp/x86/
Dblend_mask_sse4.h52 __m128i res_lo = _mm_madd_epi16(_mm_unpacklo_epi16(s0, s1), in blend_a64_d16_mask_w8_sse41() local
56 res_lo = _mm_srai_epi32(_mm_sub_epi32(res_lo, *v_round_offset), shift); in blend_a64_d16_mask_w8_sse41()
58 const __m128i res_e = _mm_packs_epi32(res_lo, res_hi); in blend_a64_d16_mask_w8_sse41()
Dconvolve_sse2.h90 const __m128i res_lo = _mm_srai_epi32(wt_res_lo, DIST_PRECISION_BITS); in comp_avg() local
93 res = _mm_packs_epi32(res_lo, res_hi); in comp_avg()
Daom_subpixel_8t_intrin_sse2.c62 __m128i res_lo = _mm_unpacklo_epi32(srcRegFilt32b1_1, srcRegFilt32b1_2); in aom_filter_block1d16_h4_sse2() local
64 srcRegFilt32b1_1 = _mm_packs_epi32(res_lo, res_hi); in aom_filter_block1d16_h4_sse2()
86 res_lo = _mm_unpacklo_epi32(srcRegFilt32b2_1, srcRegFilt32b2_2); in aom_filter_block1d16_h4_sse2()
88 srcRegFilt32b2_1 = _mm_packs_epi32(res_lo, res_hi); in aom_filter_block1d16_h4_sse2()
300 __m128i res_lo = _mm_unpacklo_epi32(srcRegFilt32b1_1, srcRegFilt32b1_2); in aom_filter_block1d8_h4_sse2() local
302 srcRegFilt32b1_1 = _mm_packs_epi32(res_lo, res_hi); in aom_filter_block1d8_h4_sse2()
Dconvolve_avx2.h414 const __m256i res_lo = _mm256_srai_epi32(wt_res_lo, DIST_PRECISION_BITS); in comp_avg() local
417 res = _mm256_packs_epi32(res_lo, res_hi); in comp_avg()
/external/libgav1/libgav1/src/dsp/arm/
Ddistance_weighted_blend_neon.cc109 const int16x8_t res_lo = in DistanceWeightedBlendLarge_NEON() local
118 vcombine_u8(vqmovun_s16(res_lo), vqmovun_s16(res_hi)); in DistanceWeightedBlendLarge_NEON()
/external/mesa3d/src/compiler/nir/
Dnir_lower_int64.c303 nir_ssa_def *res_lo = nir_iadd(b, x_lo, y_lo); in lower_iadd64() local
304 nir_ssa_def *carry = nir_b2i32(b, nir_ult(b, res_lo, x_lo)); in lower_iadd64()
307 return nir_pack_64_2x32_split(b, res_lo, res_hi); in lower_iadd64()
318 nir_ssa_def *res_lo = nir_isub(b, x_lo, y_lo); in lower_isub64() local
322 return nir_pack_64_2x32_split(b, res_lo, res_hi); in lower_isub64()
492 nir_ssa_def *res_lo = nir_ior(b, res_hi, nir_b2i32(b, is_non_zero)); in lower_isign64() local
494 return nir_pack_64_2x32_split(b, res_lo, res_hi); in lower_isign64()
775 nir_ssa_def *res_lo = nir_f2u32(b, nir_frem(b, x, div)); in lower_f2() local
776 nir_ssa_def *res = nir_pack_64_2x32_split(b, res_lo, res_hi); in lower_f2()
/external/libgav1/libgav1/src/dsp/x86/
Ddistance_weighted_blend_sse4.cc139 const __m128i res_lo = in DistanceWeightedBlendLarge_SSE4_1() local
147 StoreUnaligned16(dst + x, _mm_packus_epi16(res_lo, res_hi)); in DistanceWeightedBlendLarge_SSE4_1()
/external/u-boot/drivers/bios_emulator/x86emu/
Dops.c962 u32 res_lo,res_hi; in x86emuOp_imul_word_IMM() local
971 imul_long_direct(&res_lo,&res_hi,(s32)srcval,(s32)imm); in x86emuOp_imul_word_IMM()
972 if ((((res_lo & 0x80000000) == 0) && (res_hi == 0x00000000)) || in x86emuOp_imul_word_IMM()
973 (((res_lo & 0x80000000) != 0) && (res_hi == 0xFFFFFFFF))) { in x86emuOp_imul_word_IMM()
980 *destreg = (u32)res_lo; in x86emuOp_imul_word_IMM()
1007 u32 res_lo,res_hi; in x86emuOp_imul_word_IMM() local
1016 imul_long_direct(&res_lo,&res_hi,(s32)*srcreg,(s32)imm); in x86emuOp_imul_word_IMM()
1017 if ((((res_lo & 0x80000000) == 0) && (res_hi == 0x00000000)) || in x86emuOp_imul_word_IMM()
1018 (((res_lo & 0x80000000) != 0) && (res_hi == 0xFFFFFFFF))) { in x86emuOp_imul_word_IMM()
1025 *destreg = (u32)res_lo; in x86emuOp_imul_word_IMM()
[all …]
Dops2.c732 u32 res_lo,res_hi; in x86emuOp2_imul_R_RM() local
739 imul_long_direct(&res_lo,&res_hi,(s32)*destreg,(s32)srcval); in x86emuOp2_imul_R_RM()
747 *destreg = (u32)res_lo; in x86emuOp2_imul_R_RM()
771 u32 res_lo,res_hi; in x86emuOp2_imul_R_RM() local
777 imul_long_direct(&res_lo,&res_hi,(s32)*destreg,(s32)*srcreg); in x86emuOp2_imul_R_RM()
785 *destreg = (u32)res_lo; in x86emuOp2_imul_R_RM()
Dprim_ops.c1913 void imul_long_direct(u32 *res_lo, u32* res_hi,u32 d, u32 s) in imul_long_direct() argument
1918 *res_lo = (u32)res; in imul_long_direct()
1936 *res_lo = (rlo_hi << 16) | (rlo_lo & 0xFFFF); in imul_long_direct()
1939 d = ~*res_lo; in imul_long_direct()
1941 *res_lo = ~*res_lo+1; in imul_long_direct()
/external/u-boot/drivers/bios_emulator/include/x86emu/
Dprim_ops.h119 void imul_long_direct(u32 *res_lo, u32* res_hi,u32 d, u32 s);

12