1 /*
2 * MPEG-2 HW acceleration.
3 *
4 * copyright (c) 2010 Laurent Aimar
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23 #include "libavutil/log.h"
24
25 #include "dxva2_internal.h"
26 #include "mpegutils.h"
27 #include "mpegvideo.h"
28
/* Capacity of the per-picture slice table; dxva2_mpeg2_decode_slice()
 * refuses further slices once this many have been recorded. */
#define MAX_SLICES 1024
/* Per-picture hwaccel state, reached through
 * current_picture_ptr->hwaccel_picture_private. It is reset in start_frame,
 * extended by every decode_slice call and consumed in end_frame. */
struct dxva2_picture_context {
    DXVA_PictureParameters pp;                /* built by fill_picture_parameters() */
    DXVA_QmatrixData       qm;                /* built by fill_quantization_matrices() */
    unsigned               slice_count;       /* number of valid entries in slice[] */
    DXVA_SliceInfo         slice[MAX_SLICES]; /* one entry per recorded slice */

    const uint8_t         *bitstream;         /* buffer of the first slice of the picture;
                                               * slice data locations are offsets from it */
    unsigned               bitstream_size;    /* sum of the sizes of all recorded slices */
};
39
/**
 * Populate the DXVA picture-parameter block for the picture being decoded.
 *
 * The block is cleared first, then filled from the MPEG decoder state:
 * surface indices of the target and reference pictures, picture geometry
 * in macroblocks, picture type/structure flags, and the two packed words
 * holding the f_codes and the picture-coding-extension bits.
 *
 * @param avctx codec context, forwarded to ff_dxva2_get_surface_index()
 * @param ctx   DXVA context, forwarded to ff_dxva2_get_surface_index()
 * @param s     MPEG decoder state to read from
 * @param pp    destination, fully overwritten
 */
static void fill_picture_parameters(AVCodecContext *avctx,
                                    AVDXVAContext *ctx,
                                    const struct MpegEncContext *s,
                                    DXVA_PictureParameters *pp)
{
    const Picture *cur    = s->current_picture_ptr;
    const int field_pic   = s->picture_structure != PICT_FRAME;
    const int intra_pic   = s->pict_type == AV_PICTURE_TYPE_I;
    const int bidir_pic   = s->pict_type == AV_PICTURE_TYPE_B;
    /* Four 4-bit f_code values packed most-significant first. */
    const int f_codes     = (s->mpeg_f_code[0][0] << 12) |
                            (s->mpeg_f_code[0][1] <<  8) |
                            (s->mpeg_f_code[1][0] <<  4) |
                            (s->mpeg_f_code[1][1]      );
    /* Picture-coding-extension flags, one field per bit position. */
    const int pce_bits    = (s->intra_dc_precision         << 14) |
                            (s->picture_structure          << 12) |
                            (s->top_field_first            << 11) |
                            (s->frame_pred_frame_dct       << 10) |
                            (s->concealment_motion_vectors <<  9) |
                            (s->q_scale_type               <<  8) |
                            (s->intra_vlc_format           <<  7) |
                            (s->alternate_scan             <<  6) |
                            (s->repeat_first_field         <<  5) |
                            (s->chroma_420_type            <<  4) |
                            (s->progressive_frame          <<  3);

    memset(pp, 0, sizeof(*pp));

    /* Surfaces: 0xffff marks a reference that this picture type does not use. */
    pp->wDecodedPictureIndex     = ff_dxva2_get_surface_index(avctx, ctx, cur->f);
    pp->wDeblockedPictureIndex   = 0;
    pp->wForwardRefPictureIndex  = intra_pic
        ? 0xffff
        : ff_dxva2_get_surface_index(avctx, ctx, s->last_picture.f);
    pp->wBackwardRefPictureIndex = bidir_pic
        ? ff_dxva2_get_surface_index(avctx, ctx, s->next_picture.f)
        : 0xffff;

    /* Geometry: a field picture covers half of the macroblock rows. */
    pp->wPicWidthInMBminus1      = s->mb_width - 1;
    pp->wPicHeightInMBminus1     = (s->mb_height >> field_pic) - 1;
    pp->bMacroblockWidthMinus1   = 15;
    pp->bMacroblockHeightMinus1  = 15;
    pp->bBlockWidthMinus1        = 7;
    pp->bBlockHeightMinus1       = 7;
    pp->bBPPminus1               = 7;

    /* Picture structure and type. */
    pp->bPicStructure            = s->picture_structure;
    pp->bSecondField             = field_pic && !s->first_field;
    pp->bPicIntra                = intra_pic;
    pp->bPicBackwardPrediction   = bidir_pic;
    pp->bBidirectionalAveragingMode   = 0;
    pp->bMVprecisionAndChromaRelation = 0; /* FIXME */
    pp->bChromaFormat            = s->chroma_format;
    pp->bPicScanFixed            = 1;
    pp->bPicScanMethod           = s->alternate_scan ? 1 : 0;

    /* Fields that are always written as zero here. */
    pp->bPicReadbackRequests     = 0;
    pp->bRcontrol                = 0;
    pp->bPicSpatialResid8        = 0;
    pp->bPicOverflowBlocks       = 0;
    pp->bPicExtrapolation        = 0;
    pp->bPicDeblocked            = 0;
    pp->bPicDeblockConfined      = 0;
    pp->bPic4MVallowed           = 0;
    pp->bPicOBMC                 = 0;
    pp->bPicBinPB                = 0;
    pp->bMV_RPS                  = 0;
    pp->bReservedBits            = 0;

    pp->wBitstreamFcodes         = f_codes;
    pp->wBitstreamPCEelements    = pce_bits;
    pp->bBitstreamConcealmentNeed   = 0;
    pp->bBitstreamConcealmentMethod = 0;
}

105
/**
 * Export the decoder's four quantisation matrices to the DXVA layout.
 *
 * All four "new matrix" flags are raised. Entry k of each output matrix is
 * taken from the decoder matrix at index
 * idct_permutation[ff_zigzag_direct[k]].
 *
 * @param avctx unused
 * @param ctx   unused
 * @param s     MPEG decoder state holding the source matrices
 * @param qm    destination matrix block
 */
static void fill_quantization_matrices(AVCodecContext *avctx,
                                       AVDXVAContext *ctx,
                                       const struct MpegEncContext *s,
                                       DXVA_QmatrixData *qm)
{
    int m, k;

    for (m = 0; m < 4; m++)
        qm->bNewQmatrix[m] = 1;

    for (k = 0; k < 64; k++) {
        const int src = s->idsp.idct_permutation[ff_zigzag_direct[k]];

        qm->Qmatrix[0][k] = s->intra_matrix[src];
        qm->Qmatrix[1][k] = s->inter_matrix[src];
        qm->Qmatrix[2][k] = s->chroma_intra_matrix[src];
        qm->Qmatrix[3][k] = s->chroma_inter_matrix[src];
    }
}

122
/**
 * Describe one slice in a DXVA_SliceInfo entry.
 *
 * The entry is cleared, then filled with the slice's macroblock position,
 * its size in bits and its byte offset. wNumberMBsInSlice temporarily holds
 * the index of the slice's first macroblock; it is converted to a count
 * when the slice table is committed.
 *
 * The quantiser scale code and the macroblock bit offset are read from the
 * slice data starting at byte 4 (presumably just past the slice start code
 * - confirm against the caller). The caller must therefore supply at least
 * 4 bytes.
 *
 * @param avctx    unused
 * @param s        MPEG decoder state (current macroblock position)
 * @param slice    destination entry, fully overwritten
 * @param position byte offset of the slice relative to the first slice
 * @param buffer   slice data
 * @param size     slice size in bytes
 */
static void fill_slice(AVCodecContext *avctx,
                       const struct MpegEncContext *s,
                       DXVA_SliceInfo *slice,
                       unsigned position,
                       const uint8_t *buffer, unsigned size)
{
    const int field_pic = s->picture_structure != PICT_FRAME;
    /* Row of the slice within the (field or frame) picture. */
    const int mb_row    = s->mb_y >> field_pic;
    GetBitContext bits;

    memset(slice, 0, sizeof(*slice));

    slice->wHorizontalPosition = s->mb_x;
    slice->wVerticalPosition   = mb_row;
    slice->dwSliceBitsInBuffer = 8 * size;
    slice->dwSliceDataLocation = position;
    slice->bStartCodeBitOffset = 0;
    slice->bReservedBits       = 0;
    /* XXX Index of the first MB for now; turned into a count later. */
    slice->wNumberMBsInSlice   = mb_row * s->mb_width + s->mb_x;
    slice->wBadSliceChopping   = 0;

    /* Parse the slice header that follows the first four bytes. */
    init_get_bits(&bits, buffer + 4, 8 * (size - 4));
    slice->wQuantizerScaleCode = get_bits(&bits, 5);
    skip_1stop_8data_bits(&bits);

    /* Bit offset of the first macroblock, counted from the slice start. */
    slice->wMBbitOffset        = 4 * 8 + get_bits_count(&bits);
}
/**
 * Copy the recorded slices into the decoder's bitstream buffer and commit
 * the slice-control buffer.
 *
 * Steps:
 *  1. obtain the bitstream buffer from the active backend (D3D11 or DXVA2);
 *  2. copy every slice back to back into it, rewriting each entry's
 *     dwSliceDataLocation to its offset inside that buffer and turning
 *     wNumberMBsInSlice from "index of first MB" into "number of MBs";
 *  3. release the bitstream buffer;
 *  4. fill the bitstream descriptor @p bs;
 *  5. commit the slice table through ff_dxva2_commit_buffer() into @p sc.
 *
 * @param avctx codec context
 * @param bs    bitstream buffer descriptor to fill
 * @param sc    slice-control buffer descriptor, filled by
 *              ff_dxva2_commit_buffer()
 * @return the result of ff_dxva2_commit_buffer(), or -1 if no backend
 *         matched, a buffer could not be obtained or released, or the
 *         slices do not fit into the decoder buffer
 */
static int commit_bitstream_and_slice_buffer(AVCodecContext *avctx,
                                             DECODER_BUFFER_DESC *bs,
                                             DECODER_BUFFER_DESC *sc)
{
    const struct MpegEncContext *s = avctx->priv_data;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    struct dxva2_picture_context *ctx_pic =
        s->current_picture_ptr->hwaccel_picture_private;
    const int is_field = s->picture_structure != PICT_FRAME;
    const unsigned mb_count = s->mb_width * (s->mb_height >> is_field);
    void     *dxva_data_ptr = NULL;
    uint8_t  *dxva_data, *current, *end;
    unsigned dxva_size = 0;
    unsigned i;
    unsigned type = 0;
    int got_buffer = 0;

#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        type = D3D11_VIDEO_DECODER_BUFFER_BITSTREAM;
        if (FAILED(ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context,
                                                       D3D11VA_CONTEXT(ctx)->decoder,
                                                       type,
                                                       &dxva_size, &dxva_data_ptr)))
            return -1;
        got_buffer = 1;
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        type = DXVA2_BitStreamDateBufferType;
        if (FAILED(IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder,
                                                  type,
                                                  &dxva_data_ptr, &dxva_size)))
            return -1;
        got_buffer = 1;
    }
#endif

    /* Neither backend matched: there is no buffer to fill and nothing to
     * release, and the buffer variables must not be used. */
    if (!got_buffer)
        return -1;

    dxva_data = dxva_data_ptr;
    current   = dxva_data;
    end       = dxva_data + dxva_size;

    for (i = 0; i < ctx_pic->slice_count; i++) {
        DXVA_SliceInfo *slice = &ctx_pic->slice[i];
        /* Still relative to ctx_pic->bitstream at this point. */
        unsigned position = slice->dwSliceDataLocation;
        unsigned size     = slice->dwSliceBitsInBuffer / 8;
        if (size > end - current) {
            av_log(avctx, AV_LOG_ERROR, "Failed to build bitstream\n");
            break;
        }
        slice->dwSliceDataLocation = current - dxva_data;

        /* Each entry holds the index of its first MB; the count is the
         * distance to the next slice's first MB, or to the end of the
         * picture for the last slice. */
        if (i < ctx_pic->slice_count - 1)
            slice->wNumberMBsInSlice =
                slice[1].wNumberMBsInSlice - slice[0].wNumberMBsInSlice;
        else
            slice->wNumberMBsInSlice =
                mb_count - slice[0].wNumberMBsInSlice;

        memcpy(current, &ctx_pic->bitstream[position], size);
        current += size;
    }
    /* The buffer is released even when the loop stopped early. */
#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx))
        if (FAILED(ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
        if (FAILED(IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
    /* The loop broke out before copying every slice. */
    if (i < ctx_pic->slice_count)
        return -1;

#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = bs;
        memset(dsc11, 0, sizeof(*dsc11));
        dsc11->BufferType     = type;
        dsc11->DataSize       = current - dxva_data;
        dsc11->NumMBsInBuffer = mb_count;

        type = D3D11_VIDEO_DECODER_BUFFER_SLICE_CONTROL;
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        DXVA2_DecodeBufferDesc *dsc2 = bs;
        memset(dsc2, 0, sizeof(*dsc2));
        dsc2->CompressedBufferType = type;
        dsc2->DataSize             = current - dxva_data;
        dsc2->NumMBsInBuffer       = mb_count;

        type = DXVA2_SliceControlBufferType;
    }
#endif

    return ff_dxva2_commit_buffer(avctx, ctx, sc,
                                  type,
                                  ctx_pic->slice,
                                  ctx_pic->slice_count * sizeof(*ctx_pic->slice),
                                  mb_count);
}

252
/**
 * hwaccel start_frame callback: prepare the per-picture context.
 *
 * Builds the picture parameters and quantisation matrices for the current
 * picture and clears the slice bookkeeping, so the following decode_slice
 * calls start from an empty slice table.
 *
 * @param avctx  codec context
 * @param buffer unused
 * @param size   unused
 * @return 0 on success, -1 if the DXVA context is not valid
 */
static int dxva2_mpeg2_start_frame(AVCodecContext *avctx,
                                   av_unused const uint8_t *buffer,
                                   av_unused uint32_t size)
{
    const struct MpegEncContext *s = avctx->priv_data;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    struct dxva2_picture_context *pic =
        s->current_picture_ptr->hwaccel_picture_private;

    if (!DXVA_CONTEXT_VALID(avctx, ctx))
        return -1;
    assert(pic);

    /* Start with an empty slice table and no bitstream. */
    pic->bitstream      = NULL;
    pic->bitstream_size = 0;
    pic->slice_count    = 0;

    fill_picture_parameters(avctx, ctx, s, &pic->pp);
    fill_quantization_matrices(avctx, ctx, s, &pic->qm);

    return 0;
}

274
/**
 * hwaccel decode_slice callback: record one slice for the current picture.
 *
 * The slice data is not copied here. The first slice's buffer becomes the
 * base of the picture's bitstream, and every slice is stored as an offset
 * from that base together with its header fields (see fill_slice()).
 *
 * @param avctx  codec context
 * @param buffer slice data
 * @param size   slice size in bytes; must be at least 4 because
 *               fill_slice() parses the header starting at byte 4
 * @return 0 on success, -1 if the slice table is full or the slice is too
 *         short to be parsed
 */
static int dxva2_mpeg2_decode_slice(AVCodecContext *avctx,
                                    const uint8_t *buffer, uint32_t size)
{
    const struct MpegEncContext *s = avctx->priv_data;
    struct dxva2_picture_context *ctx_pic =
        s->current_picture_ptr->hwaccel_picture_private;
    unsigned position;

    if (ctx_pic->slice_count >= MAX_SLICES) {
        /* slice_count is unsigned, so print it with %u. */
        avpriv_request_sample(avctx, "%u slices in dxva2",
                              ctx_pic->slice_count);
        return -1;
    }
    /* fill_slice() reads from buffer[4] and computes 8 * (size - 4) in
     * unsigned arithmetic; reject shorter input before any state changes
     * so that neither can go out of range. */
    if (size < 4) {
        av_log(avctx, AV_LOG_ERROR, "Slice too short (%u bytes)\n",
               (unsigned)size);
        return -1;
    }

    if (!ctx_pic->bitstream)
        ctx_pic->bitstream = buffer;
    ctx_pic->bitstream_size += size;

    position = buffer - ctx_pic->bitstream;
    fill_slice(avctx, s, &ctx_pic->slice[ctx_pic->slice_count++], position,
               buffer, size);
    return 0;
}

297
/**
 * hwaccel end_frame callback: submit the recorded picture for decoding.
 *
 * Hands the picture parameters, the quantisation matrices and the
 * bitstream/slice commit callback to ff_dxva2_common_end_frame(). On
 * success the whole picture height is reported through
 * ff_mpeg_draw_horiz_band().
 *
 * @param avctx codec context
 * @return 0 on success, -1 if no slice data was recorded, otherwise the
 *         error returned by ff_dxva2_common_end_frame()
 */
static int dxva2_mpeg2_end_frame(AVCodecContext *avctx)
{
    struct MpegEncContext *s = avctx->priv_data;
    struct dxva2_picture_context *pic =
        s->current_picture_ptr->hwaccel_picture_private;
    int err;

    /* Nothing to submit when no slice was recorded. */
    if (!pic->slice_count || !pic->bitstream_size)
        return -1;

    err = ff_dxva2_common_end_frame(avctx, s->current_picture_ptr->f,
                                    &pic->pp, sizeof(pic->pp),
                                    &pic->qm, sizeof(pic->qm),
                                    commit_bitstream_and_slice_buffer);
    if (err)
        return err;

    ff_mpeg_draw_horiz_band(s, 0, avctx->height);
    return 0;
}

315
#if CONFIG_MPEG2_DXVA2_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_DXVA2_VLD pixel format.
 * It uses this file's start_frame/decode_slice/end_frame callbacks and
 * reserves one struct dxva2_picture_context per frame. */
const AVHWAccel ff_mpeg2_dxva2_hwaccel = {
    .name           = "mpeg2_dxva2",
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt        = AV_PIX_FMT_DXVA2_VLD,
    .init           = ff_dxva2_decode_init,
    .uninit         = ff_dxva2_decode_uninit,
    .start_frame    = dxva2_mpeg2_start_frame,
    .decode_slice   = dxva2_mpeg2_decode_slice,
    .end_frame      = dxva2_mpeg2_end_frame,
    .frame_params   = ff_dxva2_common_frame_params,
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    .priv_data_size = sizeof(FFDXVASharedContext),
};
#endif
332
#if CONFIG_MPEG2_D3D11VA_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_D3D11VA_VLD pixel format.
 * It uses this file's start_frame/decode_slice/end_frame callbacks and
 * reserves one struct dxva2_picture_context per frame. */
const AVHWAccel ff_mpeg2_d3d11va_hwaccel = {
    .name           = "mpeg2_d3d11va",
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt        = AV_PIX_FMT_D3D11VA_VLD,
    .init           = ff_dxva2_decode_init,
    .uninit         = ff_dxva2_decode_uninit,
    .start_frame    = dxva2_mpeg2_start_frame,
    .decode_slice   = dxva2_mpeg2_decode_slice,
    .end_frame      = dxva2_mpeg2_end_frame,
    .frame_params   = ff_dxva2_common_frame_params,
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    .priv_data_size = sizeof(FFDXVASharedContext),
};
#endif
349
#if CONFIG_MPEG2_D3D11VA2_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_D3D11 pixel format.
 * It uses this file's start_frame/decode_slice/end_frame callbacks and
 * reserves one struct dxva2_picture_context per frame. */
const AVHWAccel ff_mpeg2_d3d11va2_hwaccel = {
    .name           = "mpeg2_d3d11va2",
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt        = AV_PIX_FMT_D3D11,
    .init           = ff_dxva2_decode_init,
    .uninit         = ff_dxva2_decode_uninit,
    .start_frame    = dxva2_mpeg2_start_frame,
    .decode_slice   = dxva2_mpeg2_decode_slice,
    .end_frame      = dxva2_mpeg2_end_frame,
    .frame_params   = ff_dxva2_common_frame_params,
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    .priv_data_size = sizeof(FFDXVASharedContext),
};
#endif
366