/external/libaom/libaom/av1/common/x86/ |
D | highbd_inv_txfm_avx2.c | 270 const __m256i *cospi8, const __m256i *cospim56, const __m256i *cospim40, in idct32_stage4_avx2() argument 275 bf1[30] = half_btf_avx2(cospi56, &bf1[17], cospi8, &bf1[30], rounding, bit); in idct32_stage4_avx2() 554 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in idct32_low8_avx2() local 609 bf1[7] = half_btf_0_avx2(&cospi8, &bf1[4], &rounding, bit); in idct32_low8_avx2() 617 idct32_stage4_avx2(bf1, &cospim8, &cospi56, &cospi8, &cospim56, &cospim40, in idct32_low8_avx2() 679 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in idct32_low16_avx2() local 754 bf1[7] = half_btf_0_avx2(&cospi8, &bf1[4], &rounding, bit); in idct32_low16_avx2() 764 idct32_stage4_avx2(bf1, &cospim8, &cospi56, &cospi8, &cospim56, &cospim40, in idct32_low16_avx2() 841 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in idct32_avx2() local 990 bf0[7] = half_btf_avx2(&cospi8, &bf1[4], &cospi56, &bf1[7], &rounding, bit); in idct32_avx2() [all …]
|
D | highbd_inv_txfm_sse4.c | 150 const __m128i *cospi8, const __m128i *cospim56, const __m128i *cospim40, in idct32_stage4_sse4_1() argument 155 bf1[30] = half_btf_sse4_1(cospi56, &bf1[17], cospi8, &bf1[30], rounding, bit); in idct32_stage4_sse4_1() 782 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in idct8x8_sse4_1() local 816 x = _mm_mullo_epi32(in[1 * 2 + col], cospi8); in idct8x8_sse4_1() 1495 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in idct8x8_new_sse4_1() local 1522 x = _mm_mullo_epi32(in[1], cospi8); in idct8x8_new_sse4_1() 1934 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in idct16x16_low8_sse4_1() local 1974 u[7] = half_btf_0_sse4_1(&cospi8, &u[4], &rnding, bit); in idct16x16_low8_sse4_1() 2089 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in iadst16x16_low1_sse4_1() local 2117 temp1 = _mm_mullo_epi32(v[8], cospi8); in iadst16x16_low1_sse4_1() [all …]
|
/external/libaom/libaom/av1/encoder/x86/ |
D | highbd_fwd_txfm_sse4.c | 523 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in fdct4x8_sse4_1() local 600 v[1] = _mm_mullo_epi32(u[7], cospi8); in fdct4x8_sse4_1() 605 v[0] = _mm_mullo_epi32(u[4], cospi8); in fdct4x8_sse4_1() 1189 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in fdct16x16_sse4_1() local 1356 x = _mm_mullo_epi32(v[7], cospi8); in fdct16x16_sse4_1() 1361 u[7] = _mm_mullo_epi32(v[4], cospi8); in fdct16x16_sse4_1() 1473 const __m128i cospi8 = _mm_set1_epi32(cospi[8]); in fadst16x16_sse4_1() local 1647 v[8] = half_btf_sse4_1(&cospi8, &u[8], &cospi56, &u[9], &rnding, bit); in fadst16x16_sse4_1() 1651 v[12] = half_btf_sse4_1(&cospim56, &u[12], &cospi8, &u[13], &rnding, bit); in fadst16x16_sse4_1() 1652 v[13] = half_btf_sse4_1(&cospi8, &u[12], &cospi56, &u[13], &rnding, bit); in fadst16x16_sse4_1()
|
D | highbd_fwd_txfm_avx2.c | 264 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in av1_fdct8_avx2() local 328 v[1] = _mm256_mullo_epi32(u[7], cospi8); in av1_fdct8_avx2() 333 v[0] = _mm256_mullo_epi32(u[4], cospi8); in av1_fdct8_avx2() 740 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in av1_fdct16_avx2() local 907 x = _mm256_mullo_epi32(v[7], cospi8); in av1_fdct16_avx2() 912 u[7] = _mm256_mullo_epi32(v[4], cospi8); in av1_fdct16_avx2() 1023 const __m256i cospi8 = _mm256_set1_epi32(cospi[8]); in av1_fadst16_avx2() local 1199 v[8] = av1_half_btf_avx2(&cospi8, &u[8], &cospi56, &u[9], &rnding, bit); in av1_fadst16_avx2() 1204 v[12] = av1_half_btf_avx2(&cospim56, &u[12], &cospi8, &u[13], &rnding, bit); in av1_fadst16_avx2() 1205 v[13] = av1_half_btf_avx2(&cospi8, &u[12], &cospi56, &u[13], &rnding, bit); in av1_fadst16_avx2()
|