1 /*
2 * thirdpel DSP functions
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 /**
22 * @file
23 * thirdpel DSP functions
24 */
25
26 #include <stdint.h>
27
28 #include "libavutil/attributes.h"
29 #include "tpeldsp.h"
30
31 #define BIT_DEPTH 8
32 #include "pel_template.c"
33
put_tpel_pixels_mc00_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)34 static inline void put_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src,
35 int stride, int width, int height)
36 {
37 switch (width) {
38 case 2:
39 put_pixels2_8_c(dst, src, stride, height);
40 break;
41 case 4:
42 put_pixels4_8_c(dst, src, stride, height);
43 break;
44 case 8:
45 put_pixels8_8_c(dst, src, stride, height);
46 break;
47 case 16:
48 put_pixels16_8_c(dst, src, stride, height);
49 break;
50 }
51 }
52
put_tpel_pixels_mc10_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)53 static inline void put_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src,
54 int stride, int width, int height)
55 {
56 int i, j;
57
58 for (i = 0; i < height; i++) {
59 for (j = 0; j < width; j++)
60 dst[j] = ((2 * src[j] + src[j + 1] + 1) *
61 683) >> 11;
62 src += stride;
63 dst += stride;
64 }
65 }
66
put_tpel_pixels_mc20_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)67 static inline void put_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src,
68 int stride, int width, int height)
69 {
70 int i, j;
71
72 for (i = 0; i < height; i++) {
73 for (j = 0; j < width; j++)
74 dst[j] = ((src[j] + 2 * src[j + 1] + 1) *
75 683) >> 11;
76 src += stride;
77 dst += stride;
78 }
79 }
80
put_tpel_pixels_mc01_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)81 static inline void put_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src,
82 int stride, int width, int height)
83 {
84 int i, j;
85
86 for (i = 0; i < height; i++) {
87 for (j = 0; j < width; j++)
88 dst[j] = ((2 * src[j] + src[j + stride] + 1) *
89 683) >> 11;
90 src += stride;
91 dst += stride;
92 }
93 }
94
put_tpel_pixels_mc11_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)95 static inline void put_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src,
96 int stride, int width, int height)
97 {
98 int i, j;
99
100 for (i = 0; i < height; i++) {
101 for (j = 0; j < width; j++)
102 dst[j] = ((4 * src[j] + 3 * src[j + 1] +
103 3 * src[j + stride] + 2 * src[j + stride + 1] + 6) *
104 2731) >> 15;
105 src += stride;
106 dst += stride;
107 }
108 }
109
put_tpel_pixels_mc12_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)110 static inline void put_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src,
111 int stride, int width, int height)
112 {
113 int i, j;
114
115 for (i = 0; i < height; i++) {
116 for (j = 0; j < width; j++)
117 dst[j] = ((3 * src[j] + 2 * src[j + 1] +
118 4 * src[j + stride] + 3 * src[j + stride + 1] + 6) *
119 2731) >> 15;
120 src += stride;
121 dst += stride;
122 }
123 }
124
put_tpel_pixels_mc02_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)125 static inline void put_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src,
126 int stride, int width, int height)
127 {
128 int i, j;
129
130 for (i = 0; i < height; i++) {
131 for (j = 0; j < width; j++)
132 dst[j] = ((src[j] + 2 * src[j + stride] + 1) *
133 683) >> 11;
134 src += stride;
135 dst += stride;
136 }
137 }
138
put_tpel_pixels_mc21_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)139 static inline void put_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src,
140 int stride, int width, int height)
141 {
142 int i, j;
143
144 for (i = 0; i < height; i++) {
145 for (j = 0; j < width; j++)
146 dst[j] = ((3 * src[j] + 4 * src[j + 1] +
147 2 * src[j + stride] + 3 * src[j + stride + 1] + 6) *
148 2731) >> 15;
149 src += stride;
150 dst += stride;
151 }
152 }
153
put_tpel_pixels_mc22_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)154 static inline void put_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src,
155 int stride, int width, int height)
156 {
157 int i, j;
158
159 for (i = 0; i < height; i++) {
160 for (j = 0; j < width; j++)
161 dst[j] = ((2 * src[j] + 3 * src[j + 1] +
162 3 * src[j + stride] + 4 * src[j + stride + 1] + 6) *
163 2731) >> 15;
164 src += stride;
165 dst += stride;
166 }
167 }
168
avg_tpel_pixels_mc00_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)169 static inline void avg_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src,
170 int stride, int width, int height)
171 {
172 switch (width) {
173 case 2:
174 avg_pixels2_8_c(dst, src, stride, height);
175 break;
176 case 4:
177 avg_pixels4_8_c(dst, src, stride, height);
178 break;
179 case 8:
180 avg_pixels8_8_c(dst, src, stride, height);
181 break;
182 case 16:
183 avg_pixels16_8_c(dst, src, stride, height);
184 break;
185 }
186 }
187
avg_tpel_pixels_mc10_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)188 static inline void avg_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src,
189 int stride, int width, int height)
190 {
191 int i, j;
192
193 for (i = 0; i < height; i++) {
194 for (j = 0; j < width; j++)
195 dst[j] = (dst[j] +
196 (((2 * src[j] + src[j + 1] + 1) *
197 683) >> 11) + 1) >> 1;
198 src += stride;
199 dst += stride;
200 }
201 }
202
avg_tpel_pixels_mc20_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)203 static inline void avg_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src,
204 int stride, int width, int height)
205 {
206 int i, j;
207
208 for (i = 0; i < height; i++) {
209 for (j = 0; j < width; j++)
210 dst[j] = (dst[j] +
211 (((src[j] + 2 * src[j + 1] + 1) *
212 683) >> 11) + 1) >> 1;
213 src += stride;
214 dst += stride;
215 }
216 }
217
avg_tpel_pixels_mc01_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)218 static inline void avg_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src,
219 int stride, int width, int height)
220 {
221 int i, j;
222
223 for (i = 0; i < height; i++) {
224 for (j = 0; j < width; j++)
225 dst[j] = (dst[j] +
226 (((2 * src[j] + src[j + stride] + 1) *
227 683) >> 11) + 1) >> 1;
228 src += stride;
229 dst += stride;
230 }
231 }
232
avg_tpel_pixels_mc11_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)233 static inline void avg_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src,
234 int stride, int width, int height)
235 {
236 int i, j;
237
238 for (i = 0; i < height; i++) {
239 for (j = 0; j < width; j++)
240 dst[j] = (dst[j] +
241 (((4 * src[j] + 3 * src[j + 1] +
242 3 * src[j + stride] + 2 * src[j + stride + 1] + 6) *
243 2731) >> 15) + 1) >> 1;
244 src += stride;
245 dst += stride;
246 }
247 }
248
avg_tpel_pixels_mc12_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)249 static inline void avg_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src,
250 int stride, int width, int height)
251 {
252 int i, j;
253
254 for (i = 0; i < height; i++) {
255 for (j = 0; j < width; j++)
256 dst[j] = (dst[j] +
257 (((3 * src[j] + 2 * src[j + 1] +
258 4 * src[j + stride] + 3 * src[j + stride + 1] + 6) *
259 2731) >> 15) + 1) >> 1;
260 src += stride;
261 dst += stride;
262 }
263 }
264
avg_tpel_pixels_mc02_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)265 static inline void avg_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src,
266 int stride, int width, int height)
267 {
268 int i, j;
269
270 for (i = 0; i < height; i++) {
271 for (j = 0; j < width; j++)
272 dst[j] = (dst[j] +
273 (((src[j] + 2 * src[j + stride] + 1) *
274 683) >> 11) + 1) >> 1;
275 src += stride;
276 dst += stride;
277 }
278 }
279
avg_tpel_pixels_mc21_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)280 static inline void avg_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src,
281 int stride, int width, int height)
282 {
283 int i, j;
284
285 for (i = 0; i < height; i++) {
286 for (j = 0; j < width; j++)
287 dst[j] = (dst[j] +
288 (((3 * src[j] + 4 * src[j + 1] +
289 2 * src[j + stride] + 3 * src[j + stride + 1] + 6) *
290 2731) >> 15) + 1) >> 1;
291 src += stride;
292 dst += stride;
293 }
294 }
295
avg_tpel_pixels_mc22_c(uint8_t * dst,const uint8_t * src,int stride,int width,int height)296 static inline void avg_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src,
297 int stride, int width, int height)
298 {
299 int i, j;
300
301 for (i = 0; i < height; i++) {
302 for (j = 0; j < width; j++)
303 dst[j] = (dst[j] +
304 (((2 * src[j] + 3 * src[j + 1] +
305 3 * src[j + stride] + 4 * src[j + stride + 1] + 6) *
306 2731) >> 15) + 1) >> 1;
307 src += stride;
308 dst += stride;
309 }
310 }
311
ff_tpeldsp_init(TpelDSPContext * c)312 av_cold void ff_tpeldsp_init(TpelDSPContext *c)
313 {
314 c->put_tpel_pixels_tab[ 0] = put_tpel_pixels_mc00_c;
315 c->put_tpel_pixels_tab[ 1] = put_tpel_pixels_mc10_c;
316 c->put_tpel_pixels_tab[ 2] = put_tpel_pixels_mc20_c;
317 c->put_tpel_pixels_tab[ 4] = put_tpel_pixels_mc01_c;
318 c->put_tpel_pixels_tab[ 5] = put_tpel_pixels_mc11_c;
319 c->put_tpel_pixels_tab[ 6] = put_tpel_pixels_mc21_c;
320 c->put_tpel_pixels_tab[ 8] = put_tpel_pixels_mc02_c;
321 c->put_tpel_pixels_tab[ 9] = put_tpel_pixels_mc12_c;
322 c->put_tpel_pixels_tab[10] = put_tpel_pixels_mc22_c;
323
324 c->avg_tpel_pixels_tab[ 0] = avg_tpel_pixels_mc00_c;
325 c->avg_tpel_pixels_tab[ 1] = avg_tpel_pixels_mc10_c;
326 c->avg_tpel_pixels_tab[ 2] = avg_tpel_pixels_mc20_c;
327 c->avg_tpel_pixels_tab[ 4] = avg_tpel_pixels_mc01_c;
328 c->avg_tpel_pixels_tab[ 5] = avg_tpel_pixels_mc11_c;
329 c->avg_tpel_pixels_tab[ 6] = avg_tpel_pixels_mc21_c;
330 c->avg_tpel_pixels_tab[ 8] = avg_tpel_pixels_mc02_c;
331 c->avg_tpel_pixels_tab[ 9] = avg_tpel_pixels_mc12_c;
332 c->avg_tpel_pixels_tab[10] = avg_tpel_pixels_mc22_c;
333 }
334