1 /*
2  * Video Decode and Presentation API for UNIX (VDPAU) is used for
3  * HW decode acceleration for MPEG-1/2, MPEG-4 ASP, H.264 and VC-1.
4  *
5  * Copyright (c) 2008 NVIDIA
6  *
7  * This file is part of FFmpeg.
8  *
9  * FFmpeg is free software; you can redistribute it and/or
10  * modify it under the terms of the GNU Lesser General Public
11  * License as published by the Free Software Foundation; either
12  * version 2.1 of the License, or (at your option) any later version.
13  *
14  * FFmpeg is distributed in the hope that it will be useful,
15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
17  * Lesser General Public License for more details.
18  *
19  * You should have received a copy of the GNU Lesser General Public
20  * License along with FFmpeg; if not, write to the Free Software
21  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22  */
23 
24 #include <limits.h>
25 
26 #include "avcodec.h"
27 #include "decode.h"
28 #include "internal.h"
29 #include "h264dec.h"
30 #include "vc1.h"
31 #include "vdpau.h"
32 #include "vdpau_internal.h"
33 
34 // XXX: at the time of adding this ifdefery, av_assert* wasn't use outside.
35 // When dropping it, make sure other av_assert* were not added since then.
36 
37 /**
38  * @addtogroup VDPAU_Decoding
39  *
40  * @{
41  */
42 
vdpau_error(VdpStatus status)43 static int vdpau_error(VdpStatus status)
44 {
45     switch (status) {
46     case VDP_STATUS_OK:
47         return 0;
48     case VDP_STATUS_NO_IMPLEMENTATION:
49         return AVERROR(ENOSYS);
50     case VDP_STATUS_DISPLAY_PREEMPTED:
51         return AVERROR(EIO);
52     case VDP_STATUS_INVALID_HANDLE:
53         return AVERROR(EBADF);
54     case VDP_STATUS_INVALID_POINTER:
55         return AVERROR(EFAULT);
56     case VDP_STATUS_RESOURCES:
57         return AVERROR(ENOBUFS);
58     case VDP_STATUS_HANDLE_DEVICE_MISMATCH:
59         return AVERROR(EXDEV);
60     case VDP_STATUS_ERROR:
61         return AVERROR(EIO);
62     default:
63         return AVERROR(EINVAL);
64     }
65 }
66 
av_alloc_vdpaucontext(void)67 AVVDPAUContext *av_alloc_vdpaucontext(void)
68 {
69     return av_vdpau_alloc_context();
70 }
71 
MAKE_ACCESSORS(AVVDPAUContext,vdpau_hwaccel,AVVDPAU_Render2,render2)72 MAKE_ACCESSORS(AVVDPAUContext, vdpau_hwaccel, AVVDPAU_Render2, render2)
73 
74 int av_vdpau_get_surface_parameters(AVCodecContext *avctx,
75                                     VdpChromaType *type,
76                                     uint32_t *width, uint32_t *height)
77 {
78     VdpChromaType t;
79     uint32_t w = avctx->coded_width;
80     uint32_t h = avctx->coded_height;
81 
82     /* See <vdpau/vdpau.h> for per-type alignment constraints. */
83     switch (avctx->sw_pix_fmt) {
84     case AV_PIX_FMT_YUV420P:
85     case AV_PIX_FMT_YUVJ420P:
86     case AV_PIX_FMT_YUV420P10:
87     case AV_PIX_FMT_YUV420P12:
88         t = VDP_CHROMA_TYPE_420;
89         w = (w + 1) & ~1;
90         h = (h + 3) & ~3;
91         break;
92     case AV_PIX_FMT_YUV422P:
93     case AV_PIX_FMT_YUVJ422P:
94         t = VDP_CHROMA_TYPE_422;
95         w = (w + 1) & ~1;
96         h = (h + 1) & ~1;
97         break;
98     case AV_PIX_FMT_YUV444P:
99     case AV_PIX_FMT_YUVJ444P:
100     case AV_PIX_FMT_YUV444P10:
101     case AV_PIX_FMT_YUV444P12:
102         t = VDP_CHROMA_TYPE_444;
103         h = (h + 1) & ~1;
104         break;
105     default:
106         return AVERROR(ENOSYS);
107     }
108 
109     if (type)
110         *type = t;
111     if (width)
112         *width = w;
113     if (height)
114         *height = h;
115     return 0;
116 }
117 
ff_vdpau_common_frame_params(AVCodecContext * avctx,AVBufferRef * hw_frames_ctx)118 int ff_vdpau_common_frame_params(AVCodecContext *avctx,
119                                  AVBufferRef *hw_frames_ctx)
120 {
121     AVHWFramesContext *hw_frames = (AVHWFramesContext*)hw_frames_ctx->data;
122     VdpChromaType type;
123     uint32_t width;
124     uint32_t height;
125 
126     if (av_vdpau_get_surface_parameters(avctx, &type, &width, &height))
127         return AVERROR(EINVAL);
128 
129     hw_frames->format    = AV_PIX_FMT_VDPAU;
130     hw_frames->sw_format = avctx->sw_pix_fmt;
131     hw_frames->width     = width;
132     hw_frames->height    = height;
133 
134     return 0;
135 }
136 
ff_vdpau_common_init(AVCodecContext * avctx,VdpDecoderProfile profile,int level)137 int ff_vdpau_common_init(AVCodecContext *avctx, VdpDecoderProfile profile,
138                          int level)
139 {
140     VDPAUHWContext *hwctx = avctx->hwaccel_context;
141     VDPAUContext *vdctx = avctx->internal->hwaccel_priv_data;
142     VdpVideoSurfaceQueryCapabilities *surface_query_caps;
143     VdpDecoderQueryCapabilities *decoder_query_caps;
144     VdpDecoderCreate *create;
145     VdpGetInformationString *info;
146     const char *info_string;
147     void *func;
148     VdpStatus status;
149     VdpBool supported;
150     uint32_t max_level, max_mb, max_width, max_height;
151     VdpChromaType type;
152     uint32_t width;
153     uint32_t height;
154     int ret;
155 
156     vdctx->width            = UINT32_MAX;
157     vdctx->height           = UINT32_MAX;
158 
159     if (av_vdpau_get_surface_parameters(avctx, &type, &width, &height))
160         return AVERROR(ENOSYS);
161 
162     if (hwctx) {
163         hwctx->reset            = 0;
164 
165         if (hwctx->context.decoder != VDP_INVALID_HANDLE) {
166             vdctx->decoder = hwctx->context.decoder;
167             vdctx->render  = hwctx->context.render;
168             vdctx->device  = VDP_INVALID_HANDLE;
169             return 0; /* Decoder created by user */
170         }
171 
172         vdctx->device           = hwctx->device;
173         vdctx->get_proc_address = hwctx->get_proc_address;
174 
175         if (hwctx->flags & AV_HWACCEL_FLAG_IGNORE_LEVEL)
176             level = 0;
177 
178         if (!(hwctx->flags & AV_HWACCEL_FLAG_ALLOW_HIGH_DEPTH) &&
179             type != VDP_CHROMA_TYPE_420)
180             return AVERROR(ENOSYS);
181     } else {
182         AVHWFramesContext *frames_ctx;
183         AVVDPAUDeviceContext *dev_ctx;
184 
185         ret = ff_decode_get_hw_frames_ctx(avctx, AV_HWDEVICE_TYPE_VDPAU);
186         if (ret < 0)
187             return ret;
188 
189         frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
190         dev_ctx = frames_ctx->device_ctx->hwctx;
191 
192         vdctx->device           = dev_ctx->device;
193         vdctx->get_proc_address = dev_ctx->get_proc_address;
194 
195         if (avctx->hwaccel_flags & AV_HWACCEL_FLAG_IGNORE_LEVEL)
196             level = 0;
197     }
198 
199     if (level < 0)
200         return AVERROR(ENOTSUP);
201 
202     status = vdctx->get_proc_address(vdctx->device,
203                                      VDP_FUNC_ID_GET_INFORMATION_STRING,
204                                      &func);
205     if (status != VDP_STATUS_OK)
206         return vdpau_error(status);
207     else
208         info = func;
209 
210     status = info(&info_string);
211     if (status != VDP_STATUS_OK)
212         return vdpau_error(status);
213     if (avctx->codec_id == AV_CODEC_ID_HEVC && strncmp(info_string, "NVIDIA ", 7) == 0 &&
214         !(avctx->hwaccel_flags & AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH)) {
215         int driver_version = 0;
216         sscanf(info_string, "NVIDIA VDPAU Driver Shared Library  %d", &driver_version);
217         if (driver_version < 410) {
218             av_log(avctx, AV_LOG_VERBOSE, "HEVC with NVIDIA VDPAU drivers is buggy, skipping.\n");
219             return AVERROR(ENOTSUP);
220         }
221     }
222 
223     status = vdctx->get_proc_address(vdctx->device,
224                                      VDP_FUNC_ID_VIDEO_SURFACE_QUERY_CAPABILITIES,
225                                      &func);
226     if (status != VDP_STATUS_OK)
227         return vdpau_error(status);
228     else
229         surface_query_caps = func;
230 
231     status = surface_query_caps(vdctx->device, type, &supported,
232                                 &max_width, &max_height);
233     if (status != VDP_STATUS_OK)
234         return vdpau_error(status);
235     if (supported != VDP_TRUE ||
236         max_width < width || max_height < height)
237         return AVERROR(ENOTSUP);
238 
239     status = vdctx->get_proc_address(vdctx->device,
240                                      VDP_FUNC_ID_DECODER_QUERY_CAPABILITIES,
241                                      &func);
242     if (status != VDP_STATUS_OK)
243         return vdpau_error(status);
244     else
245         decoder_query_caps = func;
246 
247     status = decoder_query_caps(vdctx->device, profile, &supported, &max_level,
248                                 &max_mb, &max_width, &max_height);
249 #ifdef VDP_DECODER_PROFILE_H264_CONSTRAINED_BASELINE
250     if ((status != VDP_STATUS_OK || supported != VDP_TRUE) && profile == VDP_DECODER_PROFILE_H264_CONSTRAINED_BASELINE) {
251         profile = VDP_DECODER_PROFILE_H264_MAIN;
252         status = decoder_query_caps(vdctx->device, profile, &supported,
253                                     &max_level, &max_mb,
254                                     &max_width, &max_height);
255     }
256 #endif
257     if (status != VDP_STATUS_OK)
258         return vdpau_error(status);
259 
260     if (supported != VDP_TRUE || max_level < level ||
261         max_width < width || max_height < height)
262         return AVERROR(ENOTSUP);
263 
264     status = vdctx->get_proc_address(vdctx->device, VDP_FUNC_ID_DECODER_CREATE,
265                                      &func);
266     if (status != VDP_STATUS_OK)
267         return vdpau_error(status);
268     else
269         create = func;
270 
271     status = vdctx->get_proc_address(vdctx->device, VDP_FUNC_ID_DECODER_RENDER,
272                                      &func);
273     if (status != VDP_STATUS_OK)
274         return vdpau_error(status);
275     else
276         vdctx->render = func;
277 
278     status = create(vdctx->device, profile, width, height, avctx->refs,
279                     &vdctx->decoder);
280     if (status == VDP_STATUS_OK) {
281         vdctx->width  = avctx->coded_width;
282         vdctx->height = avctx->coded_height;
283     }
284 
285     return vdpau_error(status);
286 }
287 
ff_vdpau_common_uninit(AVCodecContext * avctx)288 int ff_vdpau_common_uninit(AVCodecContext *avctx)
289 {
290     VDPAUContext *vdctx = avctx->internal->hwaccel_priv_data;
291     VdpDecoderDestroy *destroy;
292     void *func;
293     VdpStatus status;
294 
295     if (vdctx->device == VDP_INVALID_HANDLE)
296         return 0; /* Decoder created and destroyed by user */
297     if (vdctx->width == UINT32_MAX && vdctx->height == UINT32_MAX)
298         return 0;
299 
300     status = vdctx->get_proc_address(vdctx->device,
301                                      VDP_FUNC_ID_DECODER_DESTROY, &func);
302     if (status != VDP_STATUS_OK)
303         return vdpau_error(status);
304     else
305         destroy = func;
306 
307     status = destroy(vdctx->decoder);
308     return vdpau_error(status);
309 }
310 
ff_vdpau_common_reinit(AVCodecContext * avctx)311 static int ff_vdpau_common_reinit(AVCodecContext *avctx)
312 {
313     VDPAUHWContext *hwctx = avctx->hwaccel_context;
314     VDPAUContext *vdctx = avctx->internal->hwaccel_priv_data;
315 
316     if (vdctx->device == VDP_INVALID_HANDLE)
317         return 0; /* Decoder created by user */
318     if (avctx->coded_width == vdctx->width &&
319         avctx->coded_height == vdctx->height && (!hwctx || !hwctx->reset))
320         return 0;
321 
322     avctx->hwaccel->uninit(avctx);
323     return avctx->hwaccel->init(avctx);
324 }
325 
ff_vdpau_common_start_frame(struct vdpau_picture_context * pic_ctx,av_unused const uint8_t * buffer,av_unused uint32_t size)326 int ff_vdpau_common_start_frame(struct vdpau_picture_context *pic_ctx,
327                                 av_unused const uint8_t *buffer,
328                                 av_unused uint32_t size)
329 {
330     pic_ctx->bitstream_buffers_allocated = 0;
331     pic_ctx->bitstream_buffers_used      = 0;
332     pic_ctx->bitstream_buffers           = NULL;
333     return 0;
334 }
335 
ff_vdpau_common_end_frame(AVCodecContext * avctx,AVFrame * frame,struct vdpau_picture_context * pic_ctx)336 int ff_vdpau_common_end_frame(AVCodecContext *avctx, AVFrame *frame,
337                               struct vdpau_picture_context *pic_ctx)
338 {
339     VDPAUContext *vdctx = avctx->internal->hwaccel_priv_data;
340     AVVDPAUContext *hwctx = avctx->hwaccel_context;
341     VdpVideoSurface surf = ff_vdpau_get_surface_id(frame);
342     VdpStatus status;
343     int val;
344 
345     val = ff_vdpau_common_reinit(avctx);
346     if (val < 0)
347         return val;
348 
349     if (hwctx && !hwctx->render && hwctx->render2) {
350         status = hwctx->render2(avctx, frame, (void *)&pic_ctx->info,
351                                 pic_ctx->bitstream_buffers_used, pic_ctx->bitstream_buffers);
352     } else
353     status = vdctx->render(vdctx->decoder, surf, &pic_ctx->info,
354                            pic_ctx->bitstream_buffers_used,
355                            pic_ctx->bitstream_buffers);
356 
357     av_freep(&pic_ctx->bitstream_buffers);
358 
359     return vdpau_error(status);
360 }
361 
362 #if CONFIG_MPEG1_VDPAU_HWACCEL || \
363     CONFIG_MPEG2_VDPAU_HWACCEL || CONFIG_MPEG4_VDPAU_HWACCEL || \
364     CONFIG_VC1_VDPAU_HWACCEL   || CONFIG_WMV3_VDPAU_HWACCEL
ff_vdpau_mpeg_end_frame(AVCodecContext * avctx)365 int ff_vdpau_mpeg_end_frame(AVCodecContext *avctx)
366 {
367     MpegEncContext *s = avctx->priv_data;
368     Picture *pic = s->current_picture_ptr;
369     struct vdpau_picture_context *pic_ctx = pic->hwaccel_picture_private;
370     int val;
371 
372     val = ff_vdpau_common_end_frame(avctx, pic->f, pic_ctx);
373     if (val < 0)
374         return val;
375 
376     ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
377     return 0;
378 }
379 #endif
380 
ff_vdpau_add_buffer(struct vdpau_picture_context * pic_ctx,const uint8_t * buf,uint32_t size)381 int ff_vdpau_add_buffer(struct vdpau_picture_context *pic_ctx,
382                         const uint8_t *buf, uint32_t size)
383 {
384     VdpBitstreamBuffer *buffers = pic_ctx->bitstream_buffers;
385 
386     buffers = av_fast_realloc(buffers, &pic_ctx->bitstream_buffers_allocated,
387                               (pic_ctx->bitstream_buffers_used + 1) * sizeof(*buffers));
388     if (!buffers)
389         return AVERROR(ENOMEM);
390 
391     pic_ctx->bitstream_buffers = buffers;
392     buffers += pic_ctx->bitstream_buffers_used++;
393 
394     buffers->struct_version  = VDP_BITSTREAM_BUFFER_VERSION;
395     buffers->bitstream       = buf;
396     buffers->bitstream_bytes = size;
397     return 0;
398 }
399 
400 #if FF_API_VDPAU_PROFILE
av_vdpau_get_profile(AVCodecContext * avctx,VdpDecoderProfile * profile)401 int av_vdpau_get_profile(AVCodecContext *avctx, VdpDecoderProfile *profile)
402 {
403 #define PROFILE(prof)                      \
404 do {                                       \
405     *profile = VDP_DECODER_PROFILE_##prof; \
406     return 0;                              \
407 } while (0)
408 
409     switch (avctx->codec_id) {
410     case AV_CODEC_ID_MPEG1VIDEO:               PROFILE(MPEG1);
411     case AV_CODEC_ID_MPEG2VIDEO:
412         switch (avctx->profile) {
413         case FF_PROFILE_MPEG2_MAIN:            PROFILE(MPEG2_MAIN);
414         case FF_PROFILE_MPEG2_SIMPLE:          PROFILE(MPEG2_SIMPLE);
415         default:                               return AVERROR(EINVAL);
416         }
417     case AV_CODEC_ID_H263:                     PROFILE(MPEG4_PART2_ASP);
418     case AV_CODEC_ID_MPEG4:
419         switch (avctx->profile) {
420         case FF_PROFILE_MPEG4_SIMPLE:          PROFILE(MPEG4_PART2_SP);
421         case FF_PROFILE_MPEG4_ADVANCED_SIMPLE: PROFILE(MPEG4_PART2_ASP);
422         default:                               return AVERROR(EINVAL);
423         }
424     case AV_CODEC_ID_H264:
425         switch (avctx->profile & ~FF_PROFILE_H264_INTRA) {
426         case FF_PROFILE_H264_BASELINE:         PROFILE(H264_BASELINE);
427         case FF_PROFILE_H264_CONSTRAINED_BASELINE:
428         case FF_PROFILE_H264_MAIN:             PROFILE(H264_MAIN);
429         case FF_PROFILE_H264_HIGH:             PROFILE(H264_HIGH);
430 #ifdef VDP_DECODER_PROFILE_H264_EXTENDED
431         case FF_PROFILE_H264_EXTENDED:         PROFILE(H264_EXTENDED);
432 #endif
433         default:                               return AVERROR(EINVAL);
434         }
435     case AV_CODEC_ID_WMV3:
436     case AV_CODEC_ID_VC1:
437         switch (avctx->profile) {
438         case FF_PROFILE_VC1_SIMPLE:            PROFILE(VC1_SIMPLE);
439         case FF_PROFILE_VC1_MAIN:              PROFILE(VC1_MAIN);
440         case FF_PROFILE_VC1_ADVANCED:          PROFILE(VC1_ADVANCED);
441         default:                               return AVERROR(EINVAL);
442         }
443     }
444     return AVERROR(EINVAL);
445 #undef PROFILE
446 }
447 #endif /* FF_API_VDPAU_PROFILE */
448 
av_vdpau_alloc_context(void)449 AVVDPAUContext *av_vdpau_alloc_context(void)
450 {
451     return av_mallocz(sizeof(VDPAUHWContext));
452 }
453 
av_vdpau_bind_context(AVCodecContext * avctx,VdpDevice device,VdpGetProcAddress * get_proc,unsigned flags)454 int av_vdpau_bind_context(AVCodecContext *avctx, VdpDevice device,
455                           VdpGetProcAddress *get_proc, unsigned flags)
456 {
457     VDPAUHWContext *hwctx;
458 
459     if (flags & ~(AV_HWACCEL_FLAG_IGNORE_LEVEL|AV_HWACCEL_FLAG_ALLOW_HIGH_DEPTH))
460         return AVERROR(EINVAL);
461 
462     if (av_reallocp(&avctx->hwaccel_context, sizeof(*hwctx)))
463         return AVERROR(ENOMEM);
464 
465     hwctx = avctx->hwaccel_context;
466 
467     memset(hwctx, 0, sizeof(*hwctx));
468     hwctx->context.decoder  = VDP_INVALID_HANDLE;
469     hwctx->device           = device;
470     hwctx->get_proc_address = get_proc;
471     hwctx->flags            = flags;
472     hwctx->reset            = 1;
473     return 0;
474 }
475 
476 /* @}*/
477