/external/libaom/libaom/av1/common/x86/ |
D | highbd_inv_txfm_avx2.c | 269 __m256i *bf1, const __m256i *cospim8, const __m256i *cospi56, in idct32_stage4_avx2() argument 274 temp1 = half_btf_avx2(cospim8, &bf1[17], cospi56, &bf1[30], rounding, bit); in idct32_stage4_avx2() 275 bf1[30] = half_btf_avx2(cospi56, &bf1[17], cospi8, &bf1[30], rounding, bit); in idct32_stage4_avx2() 279 bf1[29] = half_btf_avx2(cospim8, &bf1[18], cospi56, &bf1[29], rounding, bit); in idct32_stage4_avx2() 551 const __m256i cospi56 = _mm256_set1_epi32(cospi[56]); in idct32_low8_avx2() local 610 bf1[4] = half_btf_0_avx2(&cospi56, &bf1[4], &rounding, bit); in idct32_low8_avx2() 617 idct32_stage4_avx2(bf1, &cospim8, &cospi56, &cospi8, &cospim56, &cospim40, in idct32_low8_avx2() 676 const __m256i cospi56 = _mm256_set1_epi32(cospi[56]); in idct32_low16_avx2() local 755 bf1[4] = half_btf_0_avx2(&cospi56, &bf1[4], &rounding, bit); in idct32_low16_avx2() 764 idct32_stage4_avx2(bf1, &cospim8, &cospi56, &cospi8, &cospim56, &cospim40, in idct32_low16_avx2() [all …]
|
D | highbd_inv_txfm_sse4.c | 149 __m128i *bf1, const __m128i *cospim8, const __m128i *cospi56, in idct32_stage4_sse4_1() argument 154 temp1 = half_btf_sse4_1(cospim8, &bf1[17], cospi56, &bf1[30], rounding, bit); in idct32_stage4_sse4_1() 155 bf1[30] = half_btf_sse4_1(cospi56, &bf1[17], cospi8, &bf1[30], rounding, bit); in idct32_stage4_sse4_1() 160 half_btf_sse4_1(cospim8, &bf1[18], cospi56, &bf1[29], rounding, bit); in idct32_stage4_sse4_1() 777 const __m128i cospi56 = _mm_set1_epi32(cospi[56]); in idct8x8_sse4_1() local 810 x = _mm_mullo_epi32(in[1 * 2 + col], cospi56); in idct8x8_sse4_1() 817 y = _mm_mullo_epi32(in[7 * 2 + col], cospi56); in idct8x8_sse4_1() 1490 const __m128i cospi56 = _mm_set1_epi32(cospi[56]); in idct8x8_new_sse4_1() local 1516 x = _mm_mullo_epi32(in[1], cospi56); in idct8x8_new_sse4_1() 1523 y = _mm_mullo_epi32(in[7], cospi56); in idct8x8_new_sse4_1() [all …]
|
/external/libaom/libaom/av1/encoder/x86/ |
D | highbd_fwd_txfm_sse4.c | 522 const __m128i cospi56 = _mm_set1_epi32(cospi[56]); in fdct4x8_sse4_1() local 599 v[0] = _mm_mullo_epi32(u[4], cospi56); in fdct4x8_sse4_1() 606 v[1] = _mm_mullo_epi32(u[7], cospi56); in fdct4x8_sse4_1() 1188 const __m128i cospi56 = _mm_set1_epi32(cospi[56]); in fdct16x16_sse4_1() local 1355 u[4] = _mm_mullo_epi32(v[4], cospi56); in fdct16x16_sse4_1() 1362 x = _mm_mullo_epi32(v[7], cospi56); in fdct16x16_sse4_1() 1474 const __m128i cospi56 = _mm_set1_epi32(cospi[56]); in fadst16x16_sse4_1() local 1647 v[8] = half_btf_sse4_1(&cospi8, &u[8], &cospi56, &u[9], &rnding, bit); in fadst16x16_sse4_1() 1648 v[9] = half_btf_sse4_1(&cospi56, &u[8], &cospim8, &u[9], &rnding, bit); in fadst16x16_sse4_1() 1652 v[13] = half_btf_sse4_1(&cospi8, &u[12], &cospi56, &u[13], &rnding, bit); in fadst16x16_sse4_1()
|
D | highbd_fwd_txfm_avx2.c | 263 const __m256i cospi56 = _mm256_set1_epi32(cospi[56]); in av1_fdct8_avx2() local 327 v[0] = _mm256_mullo_epi32(u[4], cospi56); in av1_fdct8_avx2() 334 v[1] = _mm256_mullo_epi32(u[7], cospi56); in av1_fdct8_avx2() 739 const __m256i cospi56 = _mm256_set1_epi32(cospi[56]); in av1_fdct16_avx2() local 906 u[4] = _mm256_mullo_epi32(v[4], cospi56); in av1_fdct16_avx2() 913 x = _mm256_mullo_epi32(v[7], cospi56); in av1_fdct16_avx2() 1024 const __m256i cospi56 = _mm256_set1_epi32(cospi[56]); in av1_fadst16_avx2() local 1199 v[8] = av1_half_btf_avx2(&cospi8, &u[8], &cospi56, &u[9], &rnding, bit); in av1_fadst16_avx2() 1200 v[9] = av1_half_btf_avx2(&cospi56, &u[8], &cospim8, &u[9], &rnding, bit); in av1_fadst16_avx2() 1205 v[13] = av1_half_btf_avx2(&cospi8, &u[12], &cospi56, &u[13], &rnding, bit); in av1_fadst16_avx2()
|