Searched refs:yy_loadu_256 (Results 1 – 9 of 9) sorted by relevance
115 const __m256i s0 = yy_loadu_256(src0 + j); in av1_build_compound_diffwtd_mask_avx2()116 const __m256i s1 = yy_loadu_256(src1 + j); in av1_build_compound_diffwtd_mask_avx2()224 const __m256i s0A = yy_loadu_256(src0); in build_compound_diffwtd_mask_d16_avx2()225 const __m256i s0B = yy_loadu_256(src0 + src0_stride); in build_compound_diffwtd_mask_d16_avx2()226 const __m256i s1A = yy_loadu_256(src1); in build_compound_diffwtd_mask_d16_avx2()227 const __m256i s1B = yy_loadu_256(src1 + src1_stride); in build_compound_diffwtd_mask_d16_avx2()241 const __m256i s0A = yy_loadu_256(src0); in build_compound_diffwtd_mask_d16_avx2()242 const __m256i s0B = yy_loadu_256(src0 + 16); in build_compound_diffwtd_mask_d16_avx2()243 const __m256i s1A = yy_loadu_256(src1); in build_compound_diffwtd_mask_d16_avx2()244 const __m256i s1B = yy_loadu_256(src1 + 16); in build_compound_diffwtd_mask_d16_avx2()[all …]
95 const __m256i src_0 = yy_loadu_256(src_ij + 0); in av1_highbd_wiener_convolve_add_src_avx2()96 const __m256i src_1 = yy_loadu_256(src_ij + 1); in av1_highbd_wiener_convolve_add_src_avx2()97 const __m256i src_2 = yy_loadu_256(src_ij + 2); in av1_highbd_wiener_convolve_add_src_avx2()98 const __m256i src_3 = yy_loadu_256(src_ij + 3); in av1_highbd_wiener_convolve_add_src_avx2()99 const __m256i src_4 = yy_loadu_256(src_ij + 4); in av1_highbd_wiener_convolve_add_src_avx2()100 const __m256i src_5 = yy_loadu_256(src_ij + 5); in av1_highbd_wiener_convolve_add_src_avx2()101 const __m256i src_6 = yy_loadu_256(src_ij + 6); in av1_highbd_wiener_convolve_add_src_avx2()102 const __m256i src_7 = yy_loadu_256(src_ij + 7); in av1_highbd_wiener_convolve_add_src_avx2()181 const __m256i data_0 = yy_loadu_256(temp_ij + 0 * MAX_SB_SIZE); in av1_highbd_wiener_convolve_add_src_avx2()182 const __m256i data_1 = yy_loadu_256(temp_ij + 1 * MAX_SB_SIZE); in av1_highbd_wiener_convolve_add_src_avx2()[all …]
181 const __m256i tl = yy_loadu_256(ii - (r + 1) - (r + 1) * stride); in boxsum_from_ii()182 const __m256i tr = yy_loadu_256(ii + (r + 0) - (r + 1) * stride); in boxsum_from_ii()183 const __m256i bl = yy_loadu_256(ii - (r + 1) + r * stride); in boxsum_from_ii()184 const __m256i br = yy_loadu_256(ii + (r + 0) + r * stride); in boxsum_from_ii()303 const __m256i xtl = yy_loadu_256(buf - 1 - stride); in cross_sum()304 const __m256i xt = yy_loadu_256(buf - stride); in cross_sum()305 const __m256i xtr = yy_loadu_256(buf + 1 - stride); in cross_sum()306 const __m256i xl = yy_loadu_256(buf - 1); in cross_sum()307 const __m256i x = yy_loadu_256(buf); in cross_sum()308 const __m256i xr = yy_loadu_256(buf + 1); in cross_sum()[all …]
187 const __m256i data_0 = yy_loadu_256(data_ij + 0 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()188 const __m256i data_1 = yy_loadu_256(data_ij + 1 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()189 const __m256i data_2 = yy_loadu_256(data_ij + 2 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()190 const __m256i data_3 = yy_loadu_256(data_ij + 3 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()191 const __m256i data_4 = yy_loadu_256(data_ij + 4 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()192 const __m256i data_5 = yy_loadu_256(data_ij + 5 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()193 const __m256i data_6 = yy_loadu_256(data_ij + 6 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()194 const __m256i data_7 = yy_loadu_256(data_ij + 7 * MAX_SB_SIZE); in av1_wiener_convolve_add_src_avx2()
43 const __m256i c0 = yy_loadu_256(cf); in av1_txb_init_levels_avx2()44 const __m256i c1 = yy_loadu_256(cf + 8); in av1_txb_init_levels_avx2()56 const __m256i coeffA = yy_loadu_256(cf); in av1_txb_init_levels_avx2()57 const __m256i coeffB = yy_loadu_256(cf + 8); in av1_txb_init_levels_avx2()58 const __m256i coeffC = yy_loadu_256(cf + 16); in av1_txb_init_levels_avx2()59 const __m256i coeffD = yy_loadu_256(cf + 24); in av1_txb_init_levels_avx2()83 const __m256i coeffA = yy_loadu_256(cf); in av1_txb_init_levels_avx2()84 const __m256i coeffB = yy_loadu_256(cf + 8); in av1_txb_init_levels_avx2()85 const __m256i coeffC = yy_loadu_256(cf + 16); in av1_txb_init_levels_avx2()86 const __m256i coeffD = yy_loadu_256(cf + 24); in av1_txb_init_levels_avx2()[all …]
25 const __m256i dst0 = yy_loadu_256(dst); in acc_stat_avx2()148 const __m256i dst0 = yy_loadu_256(dst); in acc_stat_highbd_avx2()154 const __m256i dst1 = yy_loadu_256(dst + 4); in acc_stat_highbd_avx2()224 const __m256i shuffle = yy_loadu_256(g_shuffle_stats_highbd_data); in compute_stats_highbd_win7_opt_avx2()324 const __m256i shuffle = yy_loadu_256(g_shuffle_stats_highbd_data); in compute_stats_highbd_win5_opt_avx2()512 _mm256_packs_epi32(yy_loadu_256(flt0 + j), in av1_lowbd_pixel_proj_error_avx2()513 yy_loadu_256(flt0 + j + 8)), in av1_lowbd_pixel_proj_error_avx2()516 _mm256_packs_epi32(yy_loadu_256(flt1 + j), in av1_lowbd_pixel_proj_error_avx2()517 yy_loadu_256(flt1 + j + 8)), in av1_lowbd_pixel_proj_error_avx2()564 _mm256_packs_epi32(yy_loadu_256(flt + j), in av1_lowbd_pixel_proj_error_avx2()[all …]
33 const __m256i s0_0 = yy_loadu_256(src0); in blend_a64_d16_mask_w16_avx2()34 const __m256i s1_0 = yy_loadu_256(src1); in blend_a64_d16_mask_w16_avx2()55 const __m256i s0_0 = yy_loadu_256(src0); in blend_a64_d16_mask_w32_avx2()56 const __m256i s0_1 = yy_loadu_256(src0 + 16); in blend_a64_d16_mask_w32_avx2()57 const __m256i s1_0 = yy_loadu_256(src1); in blend_a64_d16_mask_w32_avx2()58 const __m256i s1_1 = yy_loadu_256(src1 + 16); in blend_a64_d16_mask_w32_avx2()109 const __m256i m = yy_loadu_256(mask + j); in lowbd_blend_a64_d16_mask_subw0_subh0_w32_avx2()132 const __m256i m_i00 = yy_loadu_256(mask); in lowbd_blend_a64_d16_mask_subw1_subh1_w16_avx2()133 const __m256i m_i10 = yy_loadu_256(mask + mask_stride); in lowbd_blend_a64_d16_mask_subw1_subh1_w16_avx2()158 const __m256i m_i00 = yy_loadu_256(mask + 2 * j); in lowbd_blend_a64_d16_mask_subw1_subh1_w32_avx2()[all …]
22 const __m256i v_a0 = yy_loadu_256(a); in sse_w32_avx2()23 const __m256i v_b0 = yy_loadu_256(b); in sse_w32_avx2()216 const __m256i v_a_w = yy_loadu_256(a); in highbd_sse_w16_avx2()217 const __m256i v_b_w = yy_loadu_256(b); in highbd_sse_w16_avx2()
34 static INLINE __m256i yy_loadu_256(const void *a) { in yy_loadu_256() function