1 /*
2 * VP9 compatible video decoder
3 *
4 * Copyright (C) 2013 Ronald S. Bultje <rsbultje gmail com>
5 * Copyright (C) 2013 Clément Bœsch <u pkh me>
6 *
7 * This file is part of FFmpeg.
8 *
9 * FFmpeg is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * FFmpeg is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with FFmpeg; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 */
23
24 #include "config.h"
25
26 #include "libavutil/attributes.h"
27 #include "libavutil/avassert.h"
28 #include "libavutil/mem_internal.h"
29
30 #include "vp9dsp.h"
31
/**
 * 8-tap sub-pixel interpolation filter coefficients.
 *
 * Layout is [filter type][row][tap]:
 *  - the first index selects one of three banks, addressed by the
 *    FILTER_8TAP_REGULAR, FILTER_8TAP_SHARP and FILTER_8TAP_SMOOTH
 *    designators;
 *  - each bank holds 16 rows of 8 int16_t coefficients.
 *
 * Every row sums to 128, and row 0 of every bank is the single tap
 * { 0, 0, 0, 128, 0, 0, 0, 0 }.
 *
 * NOTE(review): the row index is presumably the fractional sample position
 * in 1/16 steps, with 128 representing unity gain (7-bit fixed point) --
 * confirm against the motion-compensation code that reads this table.
 *
 * The table is declared through DECLARE_ALIGNED with an alignment argument
 * of 16; presumably SIMD code loads whole rows -- confirm against the
 * architecture-specific users.
 */
const DECLARE_ALIGNED(16, int16_t, ff_vp9_subpel_filters)[3][16][8] = {
/* "regular" bank */
[FILTER_8TAP_REGULAR] = {
{ 0, 0, 0, 128, 0, 0, 0, 0 },
{ 0, 1, -5, 126, 8, -3, 1, 0 },
{ -1, 3, -10, 122, 18, -6, 2, 0 },
{ -1, 4, -13, 118, 27, -9, 3, -1 },
{ -1, 4, -16, 112, 37, -11, 4, -1 },
{ -1, 5, -18, 105, 48, -14, 4, -1 },
{ -1, 5, -19, 97, 58, -16, 5, -1 },
{ -1, 6, -19, 88, 68, -18, 5, -1 },
{ -1, 6, -19, 78, 78, -19, 6, -1 },
{ -1, 5, -18, 68, 88, -19, 6, -1 },
{ -1, 5, -16, 58, 97, -19, 5, -1 },
{ -1, 4, -14, 48, 105, -18, 5, -1 },
{ -1, 4, -11, 37, 112, -16, 4, -1 },
{ -1, 3, -9, 27, 118, -13, 4, -1 },
{ 0, 2, -6, 18, 122, -10, 3, -1 },
{ 0, 1, -3, 8, 126, -5, 1, 0 },
/* "sharp" bank */
}, [FILTER_8TAP_SHARP] = {
{ 0, 0, 0, 128, 0, 0, 0, 0 },
{ -1, 3, -7, 127, 8, -3, 1, 0 },
{ -2, 5, -13, 125, 17, -6, 3, -1 },
{ -3, 7, -17, 121, 27, -10, 5, -2 },
{ -4, 9, -20, 115, 37, -13, 6, -2 },
{ -4, 10, -23, 108, 48, -16, 8, -3 },
{ -4, 10, -24, 100, 59, -19, 9, -3 },
{ -4, 11, -24, 90, 70, -21, 10, -4 },
{ -4, 11, -23, 80, 80, -23, 11, -4 },
{ -4, 10, -21, 70, 90, -24, 11, -4 },
{ -3, 9, -19, 59, 100, -24, 10, -4 },
{ -3, 8, -16, 48, 108, -23, 10, -4 },
{ -2, 6, -13, 37, 115, -20, 9, -4 },
{ -2, 5, -10, 27, 121, -17, 7, -3 },
{ -1, 3, -6, 17, 125, -13, 5, -2 },
{ 0, 1, -3, 8, 127, -7, 3, -1 },
/* "smooth" bank */
}, [FILTER_8TAP_SMOOTH] = {
{ 0, 0, 0, 128, 0, 0, 0, 0 },
{ -3, -1, 32, 64, 38, 1, -3, 0 },
{ -2, -2, 29, 63, 41, 2, -3, 0 },
{ -2, -2, 26, 63, 43, 4, -4, 0 },
{ -2, -3, 24, 62, 46, 5, -4, 0 },
{ -2, -3, 21, 60, 49, 7, -4, 0 },
{ -1, -4, 18, 59, 51, 9, -4, 0 },
{ -1, -4, 16, 57, 53, 12, -4, -1 },
{ -1, -4, 14, 55, 55, 14, -4, -1 },
{ -1, -4, 12, 53, 57, 16, -4, -1 },
{ 0, -4, 9, 51, 59, 18, -4, -1 },
{ 0, -4, 7, 49, 60, 21, -3, -2 },
{ 0, -4, 5, 46, 62, 24, -3, -2 },
{ 0, -4, 4, 43, 63, 26, -2, -2 },
{ 0, -3, 2, 41, 63, 29, -2, -2 },
{ 0, -3, 1, 38, 64, 32, -1, -3 },
}
};
86
87
ff_vp9dsp_init(VP9DSPContext * dsp,int bpp,int bitexact)88 av_cold void ff_vp9dsp_init(VP9DSPContext *dsp, int bpp, int bitexact)
89 {
90 if (bpp == 8) {
91 ff_vp9dsp_init_8(dsp);
92 } else if (bpp == 10) {
93 ff_vp9dsp_init_10(dsp);
94 } else {
95 av_assert0(bpp == 12);
96 ff_vp9dsp_init_12(dsp);
97 }
98
99 #if ARCH_AARCH64
100 ff_vp9dsp_init_aarch64(dsp, bpp);
101 #elif ARCH_ARM
102 ff_vp9dsp_init_arm(dsp, bpp);
103 #elif ARCH_X86
104 ff_vp9dsp_init_x86(dsp, bpp, bitexact);
105 #elif ARCH_MIPS
106 ff_vp9dsp_init_mips(dsp, bpp);
107 #elif ARCH_LOONGARCH
108 ff_vp9dsp_init_loongarch(dsp, bpp);
109 #endif
110 }
111