1 /*
2  * MPEG-2 HW acceleration.
3  *
4  * copyright (c) 2010 Laurent Aimar
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include "libavutil/log.h"
24 
25 #include "dxva2_internal.h"
26 #include "mpegutils.h"
27 #include "mpegvideo.h"
28 
29 #define MAX_SLICES 1024
30 struct dxva2_picture_context {
31     DXVA_PictureParameters pp;
32     DXVA_QmatrixData       qm;
33     unsigned               slice_count;
34     DXVA_SliceInfo         slice[MAX_SLICES];
35 
36     const uint8_t          *bitstream;
37     unsigned               bitstream_size;
38 };
39 
/**
 * Populate the DXVA picture parameter structure from the decoder state.
 *
 * @param avctx codec context, forwarded to ff_dxva2_get_surface_index()
 * @param ctx   DXVA context, forwarded to ff_dxva2_get_surface_index()
 * @param s     MPEG decoder state the values are read from
 * @param pp    structure to fill; it is zeroed first
 */
static void fill_picture_parameters(AVCodecContext *avctx,
                                    AVDXVAContext *ctx,
                                    const struct MpegEncContext *s,
                                    DXVA_PictureParameters *pp)
{
    const Picture *cur       = s->current_picture_ptr;
    const int      field_pic = s->picture_structure != PICT_FRAME;
    const int      intra_pic = s->pict_type == AV_PICTURE_TYPE_I;
    const int      bidir_pic = s->pict_type == AV_PICTURE_TYPE_B;
    int            fcodes;
    int            pce;

    memset(pp, 0, sizeof(*pp));

    /* Surface indices; 0xffff is stored when the picture type does not
     * use the corresponding reference. */
    pp->wDecodedPictureIndex     = ff_dxva2_get_surface_index(avctx, ctx, cur->f);
    pp->wDeblockedPictureIndex   = 0;
    pp->wForwardRefPictureIndex  =
        intra_pic ? 0xffff
                  : ff_dxva2_get_surface_index(avctx, ctx, s->last_picture.f);
    pp->wBackwardRefPictureIndex =
        bidir_pic ? ff_dxva2_get_surface_index(avctx, ctx, s->next_picture.f)
                  : 0xffff;

    /* Picture geometry; a field picture covers half of the macroblock rows. */
    pp->wPicWidthInMBminus1      = s->mb_width - 1;
    pp->wPicHeightInMBminus1     = (s->mb_height >> field_pic) - 1;
    pp->bMacroblockWidthMinus1   = 15;
    pp->bMacroblockHeightMinus1  = 15;
    pp->bBlockWidthMinus1        = 7;
    pp->bBlockHeightMinus1       = 7;
    pp->bBPPminus1               = 7;

    /* Picture structure and type. */
    pp->bPicStructure            = s->picture_structure;
    pp->bSecondField             = field_pic && !s->first_field;
    pp->bPicIntra                = intra_pic;
    pp->bPicBackwardPrediction   = bidir_pic;
    pp->bChromaFormat            = s->chroma_format;
    pp->bPicScanFixed            = 1;
    pp->bPicScanMethod           = !!s->alternate_scan;

    /* Fields that are always set to zero here. */
    pp->bBidirectionalAveragingMode   = 0;
    pp->bMVprecisionAndChromaRelation = 0; /* FIXME */
    pp->bPicReadbackRequests          = 0;
    pp->bRcontrol                     = 0;
    pp->bPicSpatialResid8             = 0;
    pp->bPicOverflowBlocks            = 0;
    pp->bPicExtrapolation             = 0;
    pp->bPicDeblocked                 = 0;
    pp->bPicDeblockConfined           = 0;
    pp->bPic4MVallowed                = 0;
    pp->bPicOBMC                      = 0;
    pp->bPicBinPB                     = 0;
    pp->bMV_RPS                       = 0;
    pp->bReservedBits                 = 0;
    pp->bBitstreamConcealmentNeed     = 0;
    pp->bBitstreamConcealmentMethod   = 0;

    /* The four f_code values, packed four bits apart. */
    fcodes  = s->mpeg_f_code[0][0] << 12;
    fcodes |= s->mpeg_f_code[0][1] <<  8;
    fcodes |= s->mpeg_f_code[1][0] <<  4;
    fcodes |= s->mpeg_f_code[1][1];
    pp->wBitstreamFcodes = fcodes;

    /* Picture coding extension flags, packed from bit 14 down to bit 3. */
    pce  = s->intra_dc_precision         << 14;
    pce |= s->picture_structure          << 12;
    pce |= s->top_field_first            << 11;
    pce |= s->frame_pred_frame_dct       << 10;
    pce |= s->concealment_motion_vectors <<  9;
    pce |= s->q_scale_type               <<  8;
    pce |= s->intra_vlc_format           <<  7;
    pce |= s->alternate_scan             <<  6;
    pce |= s->repeat_first_field         <<  5;
    pce |= s->chroma_420_type            <<  4;
    pce |= s->progressive_frame          <<  3;
    pp->wBitstreamPCEelements = pce;
}
105 
/**
 * Export the four quantization matrices of the decoder state.
 *
 * Each output position i receives the matrix entry found at
 * idct_permutation[ff_zigzag_direct[i]] in the decoder's tables.
 *
 * @param avctx unused
 * @param ctx   unused
 * @param s     MPEG decoder state holding the matrices and the permutation
 * @param qm    destination; all four matrices are flagged as new
 */
static void fill_quantization_matrices(AVCodecContext *avctx,
                                       AVDXVAContext *ctx,
                                       const struct MpegEncContext *s,
                                       DXVA_QmatrixData *qm)
{
    int pos;

    /* Every matrix is transmitted for every picture. */
    qm->bNewQmatrix[0] = 1;
    qm->bNewQmatrix[1] = 1;
    qm->bNewQmatrix[2] = 1;
    qm->bNewQmatrix[3] = 1;

    for (pos = 0; pos < 64; pos++) {
        const int src = s->idsp.idct_permutation[ff_zigzag_direct[pos]];

        qm->Qmatrix[0][pos] = s->intra_matrix[src];
        qm->Qmatrix[1][pos] = s->inter_matrix[src];
        qm->Qmatrix[2][pos] = s->chroma_intra_matrix[src];
        qm->Qmatrix[3][pos] = s->chroma_inter_matrix[src];
    }
}
122 
/**
 * Initialize one slice control record from the current decoder position
 * and the slice data.
 *
 * @param avctx    unused
 * @param s        MPEG decoder state (mb_x, mb_y, mb_width, picture_structure)
 * @param slice    record to fill; it is zeroed first
 * @param position offset of this slice, stored as dwSliceDataLocation
 * @param buffer   slice data; parsing starts at buffer[4]
 * @param size     size of the slice data in bytes
 */
static void fill_slice(AVCodecContext *avctx,
                       const struct MpegEncContext *s,
                       DXVA_SliceInfo *slice,
                       unsigned position,
                       const uint8_t *buffer, unsigned size)
{
    const int field_shift = s->picture_structure != PICT_FRAME;
    const int mb_row      = s->mb_y >> field_shift;
    GetBitContext bits;

    memset(slice, 0, sizeof(*slice));

    slice->dwSliceDataLocation = position;
    slice->dwSliceBitsInBuffer = 8 * size;
    slice->bStartCodeBitOffset = 0;
    slice->bReservedBits       = 0;
    slice->wBadSliceChopping   = 0;

    slice->wHorizontalPosition = s->mb_x;
    slice->wVerticalPosition   = mb_row;
    /* XXX This is the index of the first MB of the slice for now;
     * commit_bitstream_and_slice_buffer() turns it into an MB count. */
    slice->wNumberMBsInSlice   = mb_row * s->mb_width + s->mb_x;

    /* Parse from the fifth byte on (presumably right after the 4-byte
     * slice start code -- confirm against the caller). */
    init_get_bits(&bits, buffer + 4, 8 * (size - 4));

    slice->wQuantizerScaleCode = get_bits(&bits, 5);
    skip_1stop_8data_bits(&bits);

    /* Bit offset counted from the start of buffer: the 32 skipped bits
     * plus what the reader has consumed so far. */
    slice->wMBbitOffset        = 32 + get_bits_count(&bits);
}
/**
 * Copy every recorded slice into the decoder's bitstream buffer, describe
 * that buffer in bs and commit the slice control buffer through sc.
 *
 * While copying, each slice record is finalized: dwSliceDataLocation becomes
 * the offset inside the decoder buffer, and wNumberMBsInSlice (which held the
 * index of the slice's first macroblock) becomes a macroblock count.
 *
 * @param avctx codec context
 * @param bs    descriptor filled for the bitstream buffer
 * @param sc    descriptor passed to ff_dxva2_commit_buffer() for the slice
 *              control buffer
 * @return the result of ff_dxva2_commit_buffer(), or -1 if the decoder
 *         buffer could not be obtained, filled or released
 */
static int commit_bitstream_and_slice_buffer(AVCodecContext *avctx,
                                             DECODER_BUFFER_DESC *bs,
                                             DECODER_BUFFER_DESC *sc)
{
    const struct MpegEncContext *s = avctx->priv_data;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    struct dxva2_picture_context *ctx_pic =
        s->current_picture_ptr->hwaccel_picture_private;
    const int is_field = s->picture_structure != PICT_FRAME;
    const unsigned mb_count = s->mb_width * (s->mb_height >> is_field);
    /* Initialized so that nothing indeterminate is read if neither backend
     * branch below is taken. */
    void     *dxva_data_ptr = NULL;
    uint8_t  *dxva_data, *current, *end;
    unsigned dxva_size = 0;
    unsigned i;
    unsigned type = 0;

#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        type = D3D11_VIDEO_DECODER_BUFFER_BITSTREAM;
        if (FAILED(ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context,
                                                       D3D11VA_CONTEXT(ctx)->decoder,
                                                       type,
                                                       &dxva_size, &dxva_data_ptr)))
            return -1;
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        type = DXVA2_BitStreamDateBufferType;
        if (FAILED(IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder,
                                                  type,
                                                  &dxva_data_ptr, &dxva_size)))
            return -1;
    }
#endif

    /* No backend provided a buffer: there is nothing to write into. */
    if (!dxva_data_ptr)
        return -1;

    dxva_data = dxva_data_ptr;
    current = dxva_data;
    end = dxva_data + dxva_size;

    for (i = 0; i < ctx_pic->slice_count; i++) {
        DXVA_SliceInfo *slice = &ctx_pic->slice[i];
        unsigned position = slice->dwSliceDataLocation;
        unsigned size     = slice->dwSliceBitsInBuffer / 8;
        if (size > end - current) {
            av_log(avctx, AV_LOG_ERROR, "Failed to build bitstream\n");
            break;
        }
        /* From here on the location is relative to the decoder buffer. */
        slice->dwSliceDataLocation = current - dxva_data;

        /* wNumberMBsInSlice still holds the first-MB index set by
         * fill_slice(); the count is the distance to the next slice's first
         * MB, or to the end of the picture for the last slice. */
        if (i < ctx_pic->slice_count - 1)
            slice->wNumberMBsInSlice =
                slice[1].wNumberMBsInSlice - slice[0].wNumberMBsInSlice;
        else
            slice->wNumberMBsInSlice =
                mb_count - slice[0].wNumberMBsInSlice;

        memcpy(current, &ctx_pic->bitstream[position], size);
        current += size;
    }

    /* The buffer is released even when the copy loop stopped early. */
#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx))
        if (FAILED(ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
        if (FAILED(IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
    /* The loop broke out before all slices were copied. */
    if (i < ctx_pic->slice_count)
        return -1;

#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = bs;
        memset(dsc11, 0, sizeof(*dsc11));
        dsc11->BufferType           = type;
        dsc11->DataSize             = current - dxva_data;
        dsc11->NumMBsInBuffer       = mb_count;

        type = D3D11_VIDEO_DECODER_BUFFER_SLICE_CONTROL;
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        DXVA2_DecodeBufferDesc *dsc2 = bs;
        memset(dsc2, 0, sizeof(*dsc2));
        dsc2->CompressedBufferType = type;
        dsc2->DataSize             = current - dxva_data;
        dsc2->NumMBsInBuffer       = mb_count;

        type = DXVA2_SliceControlBufferType;
    }
#endif

    return ff_dxva2_commit_buffer(avctx, ctx, sc,
                                  type,
                                  ctx_pic->slice,
                                  ctx_pic->slice_count * sizeof(*ctx_pic->slice),
                                  mb_count);
}
252 
/**
 * Begin a new picture: fill the picture parameters and quantization
 * matrices, then clear the per-picture slice bookkeeping.
 *
 * @param avctx  codec context
 * @param buffer unused
 * @param size   unused
 * @return 0 on success, -1 if the DXVA context is not valid
 */
static int dxva2_mpeg2_start_frame(AVCodecContext *avctx,
                                   av_unused const uint8_t *buffer,
                                   av_unused uint32_t size)
{
    const struct MpegEncContext *s = avctx->priv_data;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    struct dxva2_picture_context *pic_priv;

    pic_priv = s->current_picture_ptr->hwaccel_picture_private;

    if (!DXVA_CONTEXT_VALID(avctx, ctx))
        return -1;
    assert(pic_priv);

    fill_picture_parameters(avctx, ctx, s, &pic_priv->pp);
    fill_quantization_matrices(avctx, ctx, s, &pic_priv->qm);

    /* No slice has been received for this picture yet. */
    pic_priv->bitstream      = NULL;
    pic_priv->bitstream_size = 0;
    pic_priv->slice_count    = 0;

    return 0;
}
274 
/**
 * Record one slice of the current picture.
 *
 * The first slice buffer becomes the base of the picture's bitstream; each
 * slice is stored with its offset relative to that base.
 *
 * @param avctx  codec context
 * @param buffer slice data
 * @param size   size of the slice data in bytes
 * @return 0 on success, -1 if the slice table is full or the slice is too
 *         short to be parsed
 */
static int dxva2_mpeg2_decode_slice(AVCodecContext *avctx,
                                    const uint8_t *buffer, uint32_t size)
{
    const struct MpegEncContext *s = avctx->priv_data;
    struct dxva2_picture_context *ctx_pic =
        s->current_picture_ptr->hwaccel_picture_private;
    unsigned position;

    if (ctx_pic->slice_count >= MAX_SLICES) {
        /* slice_count is unsigned, so it is printed with %u */
        avpriv_request_sample(avctx, "%u slices in dxva2",
                              ctx_pic->slice_count);
        return -1;
    }
    /* fill_slice() parses from buffer[4] and computes 8 * (size - 4),
     * which would wrap around for inputs shorter than four bytes. */
    if (size < 4)
        return -1;

    if (!ctx_pic->bitstream)
        ctx_pic->bitstream = buffer;
    ctx_pic->bitstream_size += size;

    position = buffer - ctx_pic->bitstream;
    fill_slice(avctx, s, &ctx_pic->slice[ctx_pic->slice_count++], position,
               buffer, size);
    return 0;
}
297 
/**
 * Finish the current picture: submit the collected buffers and, on
 * success, signal the whole picture height through
 * ff_mpeg_draw_horiz_band().
 *
 * @param avctx codec context
 * @return 0 on success, -1 if no slice data was collected, otherwise the
 *         error returned by ff_dxva2_common_end_frame()
 */
static int dxva2_mpeg2_end_frame(AVCodecContext *avctx)
{
    struct MpegEncContext *s = avctx->priv_data;
    struct dxva2_picture_context *pic_priv =
        s->current_picture_ptr->hwaccel_picture_private;
    int err;

    /* Both counters are unsigned, so "nothing collected" means zero. */
    if (!pic_priv->slice_count || !pic_priv->bitstream_size)
        return -1;

    err = ff_dxva2_common_end_frame(avctx, s->current_picture_ptr->f,
                                    &pic_priv->pp, sizeof(pic_priv->pp),
                                    &pic_priv->qm, sizeof(pic_priv->qm),
                                    commit_bitstream_and_slice_buffer);
    if (err)
        return err;

    ff_mpeg_draw_horiz_band(s, 0, avctx->height);
    return 0;
}
315 
#if CONFIG_MPEG2_DXVA2_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_DXVA2_VLD pixel format. */
const AVHWAccel ff_mpeg2_dxva2_hwaccel = {
    /* identification */
    .name                 = "mpeg2_dxva2",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt              = AV_PIX_FMT_DXVA2_VLD,
    /* private storage sizes */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* shared DXVA2/D3D11VA callbacks */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* MPEG-2 specific per-picture callbacks */
    .start_frame          = dxva2_mpeg2_start_frame,
    .decode_slice         = dxva2_mpeg2_decode_slice,
    .end_frame            = dxva2_mpeg2_end_frame,
};
#endif
332 
#if CONFIG_MPEG2_D3D11VA_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_D3D11VA_VLD pixel format. */
const AVHWAccel ff_mpeg2_d3d11va_hwaccel = {
    /* identification */
    .name                 = "mpeg2_d3d11va",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt              = AV_PIX_FMT_D3D11VA_VLD,
    /* private storage sizes */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* shared DXVA2/D3D11VA callbacks */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* MPEG-2 specific per-picture callbacks */
    .start_frame          = dxva2_mpeg2_start_frame,
    .decode_slice         = dxva2_mpeg2_decode_slice,
    .end_frame            = dxva2_mpeg2_end_frame,
};
#endif
349 
#if CONFIG_MPEG2_D3D11VA2_HWACCEL
/* MPEG-2 hwaccel descriptor for the AV_PIX_FMT_D3D11 pixel format. */
const AVHWAccel ff_mpeg2_d3d11va2_hwaccel = {
    /* identification */
    .name                 = "mpeg2_d3d11va2",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_MPEG2VIDEO,
    .pix_fmt              = AV_PIX_FMT_D3D11,
    /* private storage sizes */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* shared DXVA2/D3D11VA callbacks */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* MPEG-2 specific per-picture callbacks */
    .start_frame          = dxva2_mpeg2_start_frame,
    .decode_slice         = dxva2_mpeg2_decode_slice,
    .end_frame            = dxva2_mpeg2_end_frame,
};
#endif
366