1 /*
2 * Copyright (c) 2010, Google, Inc.
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 /**
22 * @file
23 * AV1 decoder support via libaom
24 */
25
26 #include <aom/aom_decoder.h>
27 #include <aom/aomdx.h>
28
29 #include "libavutil/common.h"
30 #include "libavutil/imgutils.h"
31
32 #include "avcodec.h"
33 #include "internal.h"
34 #include "profiles.h"
35
36 typedef struct AV1DecodeContext {
37 struct aom_codec_ctx decoder;
38 } AV1DecodeContext;
39
aom_init(AVCodecContext * avctx,const struct aom_codec_iface * iface)40 static av_cold int aom_init(AVCodecContext *avctx,
41 const struct aom_codec_iface *iface)
42 {
43 AV1DecodeContext *ctx = avctx->priv_data;
44 struct aom_codec_dec_cfg deccfg = {
45 .threads = FFMIN(avctx->thread_count ? avctx->thread_count : av_cpu_count(), 16)
46 };
47
48 av_log(avctx, AV_LOG_INFO, "%s\n", aom_codec_version_str());
49 av_log(avctx, AV_LOG_VERBOSE, "%s\n", aom_codec_build_config());
50
51 if (aom_codec_dec_init(&ctx->decoder, iface, &deccfg, 0) != AOM_CODEC_OK) {
52 const char *error = aom_codec_error(&ctx->decoder);
53 av_log(avctx, AV_LOG_ERROR, "Failed to initialize decoder: %s\n",
54 error);
55 return AVERROR(EINVAL);
56 }
57
58 return 0;
59 }
60
image_copy_16_to_8(AVFrame * pic,struct aom_image * img)61 static void image_copy_16_to_8(AVFrame *pic, struct aom_image *img)
62 {
63 const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pic->format);
64 int i;
65
66 for (i = 0; i < desc->nb_components; i++) {
67 int w = img->d_w;
68 int h = img->d_h;
69 int x, y;
70
71 if (i) {
72 w = (w + img->x_chroma_shift) >> img->x_chroma_shift;
73 h = (h + img->y_chroma_shift) >> img->y_chroma_shift;
74 }
75
76 for (y = 0; y < h; y++) {
77 uint16_t *src = (uint16_t *)(img->planes[i] + y * img->stride[i]);
78 uint8_t *dst = pic->data[i] + y * pic->linesize[i];
79 for (x = 0; x < w; x++)
80 *dst++ = *src++;
81 }
82 }
83 }
84
85 // returns 0 on success, AVERROR_INVALIDDATA otherwise
set_pix_fmt(AVCodecContext * avctx,struct aom_image * img)86 static int set_pix_fmt(AVCodecContext *avctx, struct aom_image *img)
87 {
88 static const enum AVColorRange color_ranges[] = {
89 AVCOL_RANGE_MPEG, AVCOL_RANGE_JPEG
90 };
91 avctx->color_range = color_ranges[img->range];
92 avctx->color_primaries = img->cp;
93 avctx->colorspace = img->mc;
94 avctx->color_trc = img->tc;
95
96 switch (img->fmt) {
97 case AOM_IMG_FMT_I420:
98 case AOM_IMG_FMT_I42016:
99 if (img->bit_depth == 8) {
100 avctx->pix_fmt = img->monochrome ?
101 AV_PIX_FMT_GRAY8 : AV_PIX_FMT_YUV420P;
102 avctx->profile = FF_PROFILE_AV1_MAIN;
103 return 0;
104 } else if (img->bit_depth == 10) {
105 avctx->pix_fmt = img->monochrome ?
106 AV_PIX_FMT_GRAY10 : AV_PIX_FMT_YUV420P10;
107 avctx->profile = FF_PROFILE_AV1_MAIN;
108 return 0;
109 } else if (img->bit_depth == 12) {
110 avctx->pix_fmt = img->monochrome ?
111 AV_PIX_FMT_GRAY12 : AV_PIX_FMT_YUV420P12;
112 avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
113 return 0;
114 } else {
115 return AVERROR_INVALIDDATA;
116 }
117 case AOM_IMG_FMT_I422:
118 case AOM_IMG_FMT_I42216:
119 if (img->bit_depth == 8) {
120 avctx->pix_fmt = AV_PIX_FMT_YUV422P;
121 avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
122 return 0;
123 } else if (img->bit_depth == 10) {
124 avctx->pix_fmt = AV_PIX_FMT_YUV422P10;
125 avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
126 return 0;
127 } else if (img->bit_depth == 12) {
128 avctx->pix_fmt = AV_PIX_FMT_YUV422P12;
129 avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
130 return 0;
131 } else {
132 return AVERROR_INVALIDDATA;
133 }
134 case AOM_IMG_FMT_I444:
135 case AOM_IMG_FMT_I44416:
136 if (img->bit_depth == 8) {
137 avctx->pix_fmt = AV_PIX_FMT_YUV444P;
138 avctx->profile = FF_PROFILE_AV1_HIGH;
139 return 0;
140 } else if (img->bit_depth == 10) {
141 avctx->pix_fmt = AV_PIX_FMT_YUV444P10;
142 avctx->profile = FF_PROFILE_AV1_HIGH;
143 return 0;
144 } else if (img->bit_depth == 12) {
145 avctx->pix_fmt = AV_PIX_FMT_YUV444P12;
146 avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;
147 return 0;
148 } else {
149 return AVERROR_INVALIDDATA;
150 }
151
152 default:
153 return AVERROR_INVALIDDATA;
154 }
155 }
156
aom_decode(AVCodecContext * avctx,void * data,int * got_frame,AVPacket * avpkt)157 static int aom_decode(AVCodecContext *avctx, void *data, int *got_frame,
158 AVPacket *avpkt)
159 {
160 AV1DecodeContext *ctx = avctx->priv_data;
161 AVFrame *picture = data;
162 const void *iter = NULL;
163 struct aom_image *img;
164 int ret;
165
166 if (aom_codec_decode(&ctx->decoder, avpkt->data, avpkt->size, NULL) !=
167 AOM_CODEC_OK) {
168 const char *error = aom_codec_error(&ctx->decoder);
169 const char *detail = aom_codec_error_detail(&ctx->decoder);
170
171 av_log(avctx, AV_LOG_ERROR, "Failed to decode frame: %s\n", error);
172 if (detail)
173 av_log(avctx, AV_LOG_ERROR, " Additional information: %s\n",
174 detail);
175 return AVERROR_INVALIDDATA;
176 }
177
178 if ((img = aom_codec_get_frame(&ctx->decoder, &iter))) {
179 if (img->d_w > img->w || img->d_h > img->h) {
180 av_log(avctx, AV_LOG_ERROR, "Display dimensions %dx%d exceed storage %dx%d\n",
181 img->d_w, img->d_h, img->w, img->h);
182 return AVERROR_EXTERNAL;
183 }
184
185 if ((ret = set_pix_fmt(avctx, img)) < 0) {
186 av_log(avctx, AV_LOG_ERROR, "Unsupported output colorspace (%d) / bit_depth (%d)\n",
187 img->fmt, img->bit_depth);
188 return ret;
189 }
190
191 if ((int)img->d_w != avctx->width || (int)img->d_h != avctx->height) {
192 av_log(avctx, AV_LOG_INFO, "dimension change! %dx%d -> %dx%d\n",
193 avctx->width, avctx->height, img->d_w, img->d_h);
194 ret = ff_set_dimensions(avctx, img->d_w, img->d_h);
195 if (ret < 0)
196 return ret;
197 }
198 if ((ret = ff_get_buffer(avctx, picture, 0)) < 0)
199 return ret;
200
201 av_reduce(&picture->sample_aspect_ratio.num,
202 &picture->sample_aspect_ratio.den,
203 picture->height * img->r_w,
204 picture->width * img->r_h,
205 INT_MAX);
206 ff_set_sar(avctx, picture->sample_aspect_ratio);
207
208 if ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) && img->bit_depth == 8)
209 image_copy_16_to_8(picture, img);
210 else
211 av_image_copy(picture->data, picture->linesize, (const uint8_t **)img->planes,
212 img->stride, avctx->pix_fmt, img->d_w, img->d_h);
213 *got_frame = 1;
214 }
215 return avpkt->size;
216 }
217
aom_free(AVCodecContext * avctx)218 static av_cold int aom_free(AVCodecContext *avctx)
219 {
220 AV1DecodeContext *ctx = avctx->priv_data;
221 aom_codec_destroy(&ctx->decoder);
222 return 0;
223 }
224
av1_init(AVCodecContext * avctx)225 static av_cold int av1_init(AVCodecContext *avctx)
226 {
227 return aom_init(avctx, &aom_codec_av1_dx_algo);
228 }
229
230 AVCodec ff_libaom_av1_decoder = {
231 .name = "libaom-av1",
232 .long_name = NULL_IF_CONFIG_SMALL("libaom AV1"),
233 .type = AVMEDIA_TYPE_VIDEO,
234 .id = AV_CODEC_ID_AV1,
235 .priv_data_size = sizeof(AV1DecodeContext),
236 .init = av1_init,
237 .close = aom_free,
238 .decode = aom_decode,
239 .capabilities = AV_CODEC_CAP_OTHER_THREADS | AV_CODEC_CAP_DR1,
240 .caps_internal = FF_CODEC_CAP_AUTO_THREADS,
241 .profiles = NULL_IF_CONFIG_SMALL(ff_av1_profiles),
242 .wrapper_name = "libaom",
243 };
244