2 * Video Decode and Presentation API for UNIX (VDPAU) is used for
3 * HW decode acceleration for MPEG-1/2, MPEG-4 ASP, H.264 and VC-1.
5 * Copyright (c) 2008 NVIDIA
7 * This file is part of FFmpeg.
9 * FFmpeg is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
14 * FFmpeg is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with FFmpeg; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
33 #include "vdpau_internal.h"
36 * @addtogroup VDPAU_Decoding
41 AVVDPAUContext *av_alloc_vdpaucontext(void)
43 return av_vdpau_alloc_context();
/* Instantiate MAKE_ACCESSORS for the render2 member (type AVVDPAU_Render2)
 * of AVVDPAUContext, using "vdpau_hwaccel" as the name argument.
 * NOTE(review): MAKE_ACCESSORS is defined outside this file; presumably it
 * expands to a getter/setter pair for that member -- confirm against its
 * definition. */
46 MAKE_ACCESSORS(AVVDPAUContext, vdpau_hwaccel, AVVDPAU_Render2, render2)
48 int ff_vdpau_common_start_frame(Picture *pic,
49 av_unused const uint8_t *buffer,
50 av_unused uint32_t size)
52 struct vdpau_picture_context *pic_ctx = pic->hwaccel_picture_private;
54 pic_ctx->bitstream_buffers_allocated = 0;
55 pic_ctx->bitstream_buffers_used = 0;
56 pic_ctx->bitstream_buffers = NULL;
60 #if CONFIG_H263_VDPAU_HWACCEL || CONFIG_MPEG1_VDPAU_HWACCEL || \
61 CONFIG_MPEG2_VDPAU_HWACCEL || CONFIG_MPEG4_VDPAU_HWACCEL || \
62 CONFIG_VC1_VDPAU_HWACCEL || CONFIG_WMV3_VDPAU_HWACCEL
/**
 * Finish a frame for the MpegEncContext based hwaccels.
 *
 * Passes the picture info and the queued bitstream buffers of the current
 * picture to the render2/render callback stored in the AVVDPAUContext,
 * calls ff_mpeg_draw_horiz_band() over the full picture height and frees the
 * per-picture buffer list.
 *
 * @param avctx codec context; hwaccel_context must point to an
 *              AVVDPAUContext and priv_data to an MpegEncContext
 *
 * NOTE(review): the declaration of res, the condition that selects between
 * render2 and render, and the return statement are not visible in this
 * listing -- confirm against the complete source.
 */
63 int ff_vdpau_mpeg_end_frame(AVCodecContext *avctx)
66 AVVDPAUContext *hwctx = avctx->hwaccel_context;
67 MpegEncContext *s = avctx->priv_data;
68 Picture *pic = s->current_picture_ptr;
69 struct vdpau_picture_context *pic_ctx = pic->hwaccel_picture_private;
70 VdpVideoSurface surf = ff_vdpau_get_surface_id(pic);
/* Mirror the per-picture state into the AVVDPAUContext fields; the
 * surrounding macros silence deprecation warnings for these accesses. */
73 FF_DISABLE_DEPRECATION_WARNINGS
74 hwctx->info = pic_ctx->info;
75 hwctx->bitstream_buffers = pic_ctx->bitstream_buffers;
76 hwctx->bitstream_buffers_used = pic_ctx->bitstream_buffers_used;
77 hwctx->bitstream_buffers_allocated = pic_ctx->bitstream_buffers_allocated;
78 FF_ENABLE_DEPRECATION_WARNINGS
/* render2 receives the codec context and the frame, and its result is kept
 * in res. */
82 res = hwctx->render2(avctx, &pic->f, (void *)&pic_ctx->info,
83 pic_ctx->bitstream_buffers_used, pic_ctx->bitstream_buffers);
/* render receives the decoder handle and the surface id instead; its result
 * is not stored. */
85 hwctx->render(hwctx->decoder, surf, (void *)&pic_ctx->info,
86 pic_ctx->bitstream_buffers_used, pic_ctx->bitstream_buffers);
88 ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
/* The descriptor array is no longer needed once the callback has run. */
89 av_freep(&pic_ctx->bitstream_buffers);
/* Clear the mirrored fields as well so the context does not keep a pointer
 * to the array that was just freed. */
92 FF_DISABLE_DEPRECATION_WARNINGS
93 hwctx->bitstream_buffers = NULL;
94 hwctx->bitstream_buffers_used = 0;
95 hwctx->bitstream_buffers_allocated = 0;
96 FF_ENABLE_DEPRECATION_WARNINGS
103 int ff_vdpau_add_buffer(Picture *pic, const uint8_t *buf, uint32_t size)
105 struct vdpau_picture_context *pic_ctx = pic->hwaccel_picture_private;
106 VdpBitstreamBuffer *buffers = pic_ctx->bitstream_buffers;
108 buffers = av_fast_realloc(buffers, &pic_ctx->bitstream_buffers_allocated,
109 (pic_ctx->bitstream_buffers_used + 1) * sizeof(*buffers));
111 return AVERROR(ENOMEM);
113 pic_ctx->bitstream_buffers = buffers;
114 buffers += pic_ctx->bitstream_buffers_used++;
116 buffers->struct_version = VDP_BITSTREAM_BUFFER_VERSION;
117 buffers->bitstream = buf;
118 buffers->bitstream_bytes = size;
122 /* Obsolete non-hwaccel VDPAU support below... */
/**
 * Build the VDPAU reference frame table of the current H.264 picture.
 *
 * Walks h->short_ref and h->long_ref and records pictures that are still
 * marked as reference in render->info.h264.referenceFrames. Table slots left
 * over after the walk are reset to VDP_INVALID_HANDLE / 0.
 *
 * @param h H.264 decoder context; data[0] of the current picture's frame is
 *          reinterpreted as a struct vdpau_render_state
 *
 * NOTE(review): several statements of this function (the declaration and
 * assignment of pic, the statements guarded by the if conditions, the header
 * of the duplicate search) are not visible in this listing -- confirm the
 * details against the complete source.
 */
124 void ff_vdpau_h264_set_reference_frames(H264Context *h)
126 struct vdpau_render_state *render, *render_ref;
127 VdpReferenceFrameH264 *rf, *rf2;
129 int i, list, pic_frame_idx;
131 render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0];
/* rf always points at the next unused slot of the table. */
134 rf = &render->info.h264.referenceFrames[0];
135 #define H264_RF_COUNT FF_ARRAY_ELEMS(render->info.h264.referenceFrames)
/* list 0 covers h->short_ref (short_ref_count entries), list 1 covers
 * h->long_ref (16 entries). */
137 for (list = 0; list < 2; ++list) {
138 Picture **lp = list ? h->long_ref : h->short_ref;
139 int ls = list ? 16 : h->short_ref_count;
141 for (i = 0; i < ls; ++i) {
/* Empty entries and pictures no longer used as reference are tested for
 * here. */
143 if (!pic || !pic->reference)
/* Long-term pictures are identified by pic_id, short-term ones by
 * frame_num. */
145 pic_frame_idx = pic->long_ref ? pic->pic_id : pic->frame_num;
147 render_ref = (struct vdpau_render_state *)pic->f.data[0];
/* Compare against the table from its first slot on: an entry matches when
 * surface, long-term flag and frame index all agree. */
150 rf2 = &render->info.h264.referenceFrames[0];
153 (rf2->surface == render_ref->surface)
154 && (rf2->is_long_term == pic->long_ref)
155 && (rf2->frame_idx == pic_frame_idx)
/* Merge this picture's field reference bits into the entry rf2 points at. */
161 rf2->top_is_reference |= (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE;
162 rf2->bottom_is_reference |= (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE;
/* Bounds test: rf must not run past the end of the table. */
166 if (rf >= &render->info.h264.referenceFrames[H264_RF_COUNT])
/* Fill a fresh slot from the reference picture. */
169 rf->surface = render_ref->surface;
170 rf->is_long_term = pic->long_ref;
171 rf->top_is_reference = (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE;
172 rf->bottom_is_reference = (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE;
173 rf->field_order_cnt[0] = pic->field_poc[0];
174 rf->field_order_cnt[1] = pic->field_poc[1];
175 rf->frame_idx = pic_frame_idx;
/* Mark every slot from rf to the end of the table as unused. */
181 for (; rf < &render->info.h264.referenceFrames[H264_RF_COUNT]; ++rf) {
182 rf->surface = VDP_INVALID_HANDLE;
183 rf->is_long_term = 0;
184 rf->top_is_reference = 0;
185 rf->bottom_is_reference = 0;
186 rf->field_order_cnt[0] = 0;
187 rf->field_order_cnt[1] = 0;
192 void ff_vdpau_add_data_chunk(uint8_t *data, const uint8_t *buf, int buf_size)
194 struct vdpau_render_state *render = (struct vdpau_render_state*)data;
197 render->bitstream_buffers= av_fast_realloc(
198 render->bitstream_buffers,
199 &render->bitstream_buffers_allocated,
200 sizeof(*render->bitstream_buffers)*(render->bitstream_buffers_used + 1)
203 render->bitstream_buffers[render->bitstream_buffers_used].struct_version = VDP_BITSTREAM_BUFFER_VERSION;
204 render->bitstream_buffers[render->bitstream_buffers_used].bitstream = buf;
205 render->bitstream_buffers[render->bitstream_buffers_used].bitstream_bytes = buf_size;
206 render->bitstream_buffers_used++;
209 #if CONFIG_H264_VDPAU_DECODER
/**
 * Seed the H.264 picture info of the current picture.
 *
 * Stores the two field order counts and the frame number of the current
 * picture in render->info.h264.
 *
 * @param h H.264 decoder context; data[0] of the current picture's frame is
 *          reinterpreted as a struct vdpau_render_state
 */
210 void ff_vdpau_h264_picture_start(H264Context *h)
212 struct vdpau_render_state *render;
215 render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0];
/* One iteration per field. */
218 for (i = 0; i < 2; ++i) {
/* NOTE(review): foc is a local copy, which suggests it may be adjusted
 * before being stored; no such adjustment is visible in this listing --
 * confirm against the complete source. */
219 int foc = h->cur_pic_ptr->field_poc[i];
222 render->info.h264.field_order_cnt[i] = foc;
225 render->info.h264.frame_num = h->frame_num;
/**
 * Finalize the H.264 picture info of the current picture.
 *
 * Copies slice count, picture structure flags and the SPS/PPS derived
 * parameters (including the scaling lists) into render->info.h264, calls
 * ff_h264_draw_horiz_band() over the full picture height and resets the
 * count of queued bitstream buffers.
 *
 * @param h H.264 decoder context; data[0] of the current picture's frame is
 *          reinterpreted as a struct vdpau_render_state
 */
228 void ff_vdpau_h264_picture_complete(H264Context *h)
230 struct vdpau_render_state *render;
232 render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0];
235 render->info.h264.slice_count = h->slice_num;
/* NOTE(review): the statement guarded by this test is not visible in this
 * listing; presumably the function bails out when no slice was decoded --
 * confirm. */
236 if (render->info.h264.slice_count < 1)
/* Reference picture if either of the two low bits of reference is set. */
239 render->info.h264.is_reference = (h->cur_pic_ptr->reference & 3) ? VDP_TRUE : VDP_FALSE;
240 render->info.h264.field_pic_flag = h->picture_structure != PICT_FRAME;
241 render->info.h264.bottom_field_flag = h->picture_structure == PICT_BOTTOM_FIELD;
242 render->info.h264.num_ref_frames = h->sps.ref_frame_count;
/* Relies on field_pic_flag assigned above: MBAFF is only signalled for
 * pictures that are not field pictures. */
243 render->info.h264.mb_adaptive_frame_field_flag = h->sps.mb_aff && !render->info.h264.field_pic_flag;
244 render->info.h264.constrained_intra_pred_flag = h->pps.constrained_intra_pred;
245 render->info.h264.weighted_pred_flag = h->pps.weighted_pred;
246 render->info.h264.weighted_bipred_idc = h->pps.weighted_bipred_idc;
247 render->info.h264.frame_mbs_only_flag = h->sps.frame_mbs_only_flag;
248 render->info.h264.transform_8x8_mode_flag = h->pps.transform_8x8_mode;
249 render->info.h264.chroma_qp_index_offset = h->pps.chroma_qp_index_offset[0];
250 render->info.h264.second_chroma_qp_index_offset = h->pps.chroma_qp_index_offset[1];
/* The destination fields below carry "_minus" offsets in their names, so
 * the decoder's values are converted accordingly. */
251 render->info.h264.pic_init_qp_minus26 = h->pps.init_qp - 26;
252 render->info.h264.num_ref_idx_l0_active_minus1 = h->pps.ref_count[0] - 1;
253 render->info.h264.num_ref_idx_l1_active_minus1 = h->pps.ref_count[1] - 1;
254 render->info.h264.log2_max_frame_num_minus4 = h->sps.log2_max_frame_num - 4;
255 render->info.h264.pic_order_cnt_type = h->sps.poc_type;
/* log2_max_poc_lsb is only used when poc_type is 0; otherwise 0 is stored. */
256 render->info.h264.log2_max_pic_order_cnt_lsb_minus4 = h->sps.poc_type ? 0 : h->sps.log2_max_poc_lsb - 4;
257 render->info.h264.delta_pic_order_always_zero_flag = h->sps.delta_pic_order_always_zero_flag;
258 render->info.h264.direct_8x8_inference_flag = h->sps.direct_8x8_inference_flag;
259 render->info.h264.entropy_coding_mode_flag = h->pps.cabac;
260 render->info.h264.pic_order_present_flag = h->pps.pic_order_present;
261 render->info.h264.deblocking_filter_control_present_flag = h->pps.deblocking_filter_parameters_present;
262 render->info.h264.redundant_pic_cnt_present_flag = h->pps.redundant_pic_cnt_present;
/* Copy sizes are taken from the destination arrays. The second 8x8 list is
 * read from scaling_matrix8[3], not [1]. */
263 memcpy(render->info.h264.scaling_lists_4x4, h->pps.scaling_matrix4, sizeof(render->info.h264.scaling_lists_4x4));
264 memcpy(render->info.h264.scaling_lists_8x8[0], h->pps.scaling_matrix8[0], sizeof(render->info.h264.scaling_lists_8x8[0]));
265 memcpy(render->info.h264.scaling_lists_8x8[1], h->pps.scaling_matrix8[3], sizeof(render->info.h264.scaling_lists_8x8[0]));
267 ff_h264_draw_horiz_band(h, 0, h->avctx->height);
/* Only the used count is reset here; the descriptor array itself is not
 * freed in this function. */
268 render->bitstream_buffers_used = 0;
270 #endif /* CONFIG_H264_VDPAU_DECODER */
272 #if CONFIG_MPEG_VDPAU_DECODER || CONFIG_MPEG1_VDPAU_DECODER
/**
 * Fill the MPEG-1/2 picture info of the current picture and submit it.
 *
 * Copies the picture parameters and quantizer matrices from the
 * MpegEncContext into render->info.mpeg, resolves the reference surfaces,
 * queues buf as a bitstream chunk, calls ff_mpeg_draw_horiz_band() over the
 * full picture height and resets the count of queued bitstream buffers.
 *
 * @param s           MPEG decoder context
 * @param buf         start of the picture's bitstream data
 * @param buf_size    length of buf in bytes
 * @param slice_count stored in render->info.mpeg.slice_count
 *
 * NOTE(review): some lines of this function (e.g. the declaration of i and
 * whatever precedes the ff_mpeg_draw_horiz_band() call) are not visible in
 * this listing -- confirm against the complete source.
 */
273 void ff_vdpau_mpeg_picture_complete(MpegEncContext *s, const uint8_t *buf,
274 int buf_size, int slice_count)
276 struct vdpau_render_state *render, *last, *next;
/* Nothing to do without a current picture. */
279 if (!s->current_picture_ptr) return;
/* data[0] of the current picture's frame is reinterpreted as the render
 * state. */
281 render = (struct vdpau_render_state *)s->current_picture_ptr->f.data[0];
284 /* fill VdpPictureInfoMPEG1Or2 struct */
285 render->info.mpeg.picture_structure = s->picture_structure;
286 render->info.mpeg.picture_coding_type = s->pict_type;
287 render->info.mpeg.intra_dc_precision = s->intra_dc_precision;
288 render->info.mpeg.frame_pred_frame_dct = s->frame_pred_frame_dct;
289 render->info.mpeg.concealment_motion_vectors = s->concealment_motion_vectors;
290 render->info.mpeg.intra_vlc_format = s->intra_vlc_format;
291 render->info.mpeg.alternate_scan = s->alternate_scan;
292 render->info.mpeg.q_scale_type = s->q_scale_type;
293 render->info.mpeg.top_field_first = s->top_field_first;
294 render->info.mpeg.full_pel_forward_vector = s->full_pel[0]; // MPEG-1 only. Set 0 for MPEG-2
295 render->info.mpeg.full_pel_backward_vector = s->full_pel[1]; // MPEG-1 only. Set 0 for MPEG-2
296 render->info.mpeg.f_code[0][0] = s->mpeg_f_code[0][0]; // For MPEG-1 fill both horiz. & vert.
297 render->info.mpeg.f_code[0][1] = s->mpeg_f_code[0][1];
298 render->info.mpeg.f_code[1][0] = s->mpeg_f_code[1][0];
299 render->info.mpeg.f_code[1][1] = s->mpeg_f_code[1][1];
/* Copy both 64-entry quantizer matrices element by element. */
300 for (i = 0; i < 64; ++i) {
301 render->info.mpeg.intra_quantizer_matrix[i] = s->intra_matrix[i];
302 render->info.mpeg.non_intra_quantizer_matrix[i] = s->inter_matrix[i];
/* Default to "no reference"; the switch below overrides this for B and P
 * pictures. */
305 render->info.mpeg.forward_reference = VDP_INVALID_HANDLE;
306 render->info.mpeg.backward_reference = VDP_INVALID_HANDLE;
308 switch(s->pict_type){
/* B pictures take the backward reference from next_picture and then
 * continue into the P case for the forward reference. */
309 case AV_PICTURE_TYPE_B:
310 next = (struct vdpau_render_state *)s->next_picture.f.data[0];
312 render->info.mpeg.backward_reference = next->surface;
313 // no return here, going to set forward prediction
314 case AV_PICTURE_TYPE_P:
315 last = (struct vdpau_render_state *)s->last_picture.f.data[0];
316 if (!last) // FIXME: Does this test make sense?
317 last = render; // predict second field from the first
318 render->info.mpeg.forward_reference = last->surface;
/* Queue the picture's bitstream data on the current render state. */
321 ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size);
323 render->info.mpeg.slice_count = slice_count;
326 ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
/* Only the used count is reset here; the descriptor array itself is not
 * freed in this function. */
327 render->bitstream_buffers_used = 0;
329 #endif /* CONFIG_MPEG_VDPAU_DECODER || CONFIG_MPEG1_VDPAU_DECODER */
331 #if CONFIG_VC1_VDPAU_DECODER
/**
 * Fill the VC-1 picture info of the current picture and submit it.
 *
 * Copies sequence/entry-point and picture level parameters from the
 * VC1Context into render->info.vc1, resolves the reference surfaces, queues
 * buf as a bitstream chunk, calls ff_mpeg_draw_horiz_band() over the full
 * picture height and resets the count of queued bitstream buffers.
 *
 * @param s   MPEG decoder context; s->avctx->priv_data is used as VC1Context
 * @param buf start of the picture's bitstream data
 *
 * NOTE(review): the end of the parameter list and the condition that
 * chooses between the two picture_type assignments are not visible in this
 * listing -- confirm against the complete source.
 */
332 void ff_vdpau_vc1_decode_picture(MpegEncContext *s, const uint8_t *buf,
335 VC1Context *v = s->avctx->priv_data;
336 struct vdpau_render_state *render, *last, *next;
/* The render state is read from s->current_picture here, whereas the chunk
 * is queued via s->current_picture_ptr further down. */
338 render = (struct vdpau_render_state *)s->current_picture.f.data[0];
341 /* fill VdpPictureInfoVC1 struct */
/* fcm 0 maps to 0; any other value is shifted up by one. */
342 render->info.vc1.frame_coding_mode = v->fcm ? v->fcm + 1 : 0;
343 render->info.vc1.postprocflag = v->postprocflag;
344 render->info.vc1.pulldown = v->broadcast;
345 render->info.vc1.interlace = v->interlace;
346 render->info.vc1.tfcntrflag = v->tfcntrflag;
347 render->info.vc1.finterpflag = v->finterpflag;
348 render->info.vc1.psf = v->psf;
349 render->info.vc1.dquant = v->dquant;
350 render->info.vc1.panscan_flag = v->panscanflag;
351 render->info.vc1.refdist_flag = v->refdist_flag;
352 render->info.vc1.quantizer = v->quantizer_mode;
353 render->info.vc1.extended_mv = v->extended_mv;
354 render->info.vc1.extended_dmv = v->extended_dmv;
355 render->info.vc1.overlap = v->overlap;
356 render->info.vc1.vstransform = v->vstransform;
357 render->info.vc1.loopfilter = v->s.loop_filter;
358 render->info.vc1.fastuvmc = v->fastuvmc;
359 render->info.vc1.range_mapy_flag = v->range_mapy_flag;
360 render->info.vc1.range_mapy = v->range_mapy;
361 render->info.vc1.range_mapuv_flag = v->range_mapuv_flag;
362 render->info.vc1.range_mapuv = v->range_mapuv;
363 /* Specific to simple/main profile only */
364 render->info.vc1.multires = v->multires;
365 render->info.vc1.syncmarker = v->resync_marker;
/* rangered goes into bit 0, rangeredfrm into bit 1. */
366 render->info.vc1.rangered = v->rangered | (v->rangeredfrm << 1);
367 render->info.vc1.maxbframes = v->s.max_b_frames;
/* Only the lowest bit of postprocflag is used. */
369 render->info.vc1.deblockEnable = v->postprocflag & 1;
370 render->info.vc1.pquant = v->pq;
/* Default to "no reference"; the switch below overrides this for B and P
 * pictures. */
372 render->info.vc1.forward_reference = VDP_INVALID_HANDLE;
373 render->info.vc1.backward_reference = VDP_INVALID_HANDLE;
/* picture_type is either the constant 4 or a value derived from pict_type. */
376 render->info.vc1.picture_type = 4;
378 render->info.vc1.picture_type = s->pict_type - 1 + s->pict_type / 3;
380 switch(s->pict_type){
/* B pictures take the backward reference from next_picture and then
 * continue into the P case for the forward reference. */
381 case AV_PICTURE_TYPE_B:
382 next = (struct vdpau_render_state *)s->next_picture.f.data[0];
384 render->info.vc1.backward_reference = next->surface;
385 // no break here, going to set forward prediction
386 case AV_PICTURE_TYPE_P:
387 last = (struct vdpau_render_state *)s->last_picture.f.data[0];
388 if (!last) // FIXME: Does this test make sense?
389 last = render; // predict second field from the first
390 render->info.vc1.forward_reference = last->surface;
/* Queue the picture's bitstream data on the current render state. */
393 ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size);
/* The whole picture is always submitted as a single slice. */
395 render->info.vc1.slice_count = 1;
397 ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
/* Only the used count is reset here; the descriptor array itself is not
 * freed in this function. */
398 render->bitstream_buffers_used = 0;
400 #endif /* CONFIG_VC1_VDPAU_DECODER */
402 #if CONFIG_MPEG4_VDPAU_DECODER
/**
 * Fill the MPEG-4 Part 2 picture info of the current picture and submit it.
 *
 * Copies timing, VOP and quantizer parameters from the decoder contexts into
 * render->info.mpeg4, resolves the reference surfaces, queues buf as a
 * bitstream chunk, calls ff_mpeg_draw_horiz_band() over the full picture
 * height and resets the count of queued bitstream buffers.
 *
 * @param ctx MPEG-4 decoder context; its embedded MpegEncContext (ctx->m)
 *            supplies most values
 * @param buf start of the picture's bitstream data
 *
 * NOTE(review): the end of the parameter list and some statements (e.g. the
 * declaration of i) are not visible in this listing -- confirm against the
 * complete source.
 */
403 void ff_vdpau_mpeg4_decode_picture(Mpeg4DecContext *ctx, const uint8_t *buf,
406 MpegEncContext *s = &ctx->m;
407 struct vdpau_render_state *render, *last, *next;
/* Nothing to do without a current picture. */
410 if (!s->current_picture_ptr) return;
/* data[0] of the current picture's frame is reinterpreted as the render
 * state. */
412 render = (struct vdpau_render_state *)s->current_picture_ptr->f.data[0];
415 /* fill VdpPictureInfoMPEG4Part2 struct */
416 render->info.mpeg4.trd[0] = s->pp_time;
417 render->info.mpeg4.trb[0] = s->pb_time;
/* The field based distances are halved before being stored. */
418 render->info.mpeg4.trd[1] = s->pp_field_time >> 1;
419 render->info.mpeg4.trb[1] = s->pb_field_time >> 1;
420 render->info.mpeg4.vop_time_increment_resolution = s->avctx->time_base.den;
/* Starts at 0 and is raised to 2 in the B case below.
 * NOTE(review): no assignment for P pictures is visible in this listing, so
 * they appear to keep 0 -- confirm this is intended. */
421 render->info.mpeg4.vop_coding_type = 0;
422 render->info.mpeg4.vop_fcode_forward = s->f_code;
423 render->info.mpeg4.vop_fcode_backward = s->b_code;
/* Inverted: the destination flag means "disabled". */
424 render->info.mpeg4.resync_marker_disable = !ctx->resync_marker;
425 render->info.mpeg4.interlaced = !s->progressive_sequence;
426 render->info.mpeg4.quant_type = s->mpeg_quant;
427 render->info.mpeg4.quarter_sample = s->quarter_sample;
/* Set when the active codec is the H.263 one. */
428 render->info.mpeg4.short_video_header = s->avctx->codec->id == AV_CODEC_ID_H263;
429 render->info.mpeg4.rounding_control = s->no_rounding;
430 render->info.mpeg4.alternate_vertical_scan_flag = s->alternate_scan;
431 render->info.mpeg4.top_field_first = s->top_field_first;
/* Copy both 64-entry quantizer matrices element by element. */
432 for (i = 0; i < 64; ++i) {
433 render->info.mpeg4.intra_quantizer_matrix[i] = s->intra_matrix[i];
434 render->info.mpeg4.non_intra_quantizer_matrix[i] = s->inter_matrix[i];
/* Default to "no reference"; the switch below overrides this for B and P
 * pictures. */
436 render->info.mpeg4.forward_reference = VDP_INVALID_HANDLE;
437 render->info.mpeg4.backward_reference = VDP_INVALID_HANDLE;
439 switch (s->pict_type) {
/* B pictures take the backward reference from next_picture and then
 * continue into the P case for the forward reference. */
440 case AV_PICTURE_TYPE_B:
441 next = (struct vdpau_render_state *)s->next_picture.f.data[0];
443 render->info.mpeg4.backward_reference = next->surface;
444 render->info.mpeg4.vop_coding_type = 2;
445 // no break here, going to set forward prediction
446 case AV_PICTURE_TYPE_P:
447 last = (struct vdpau_render_state *)s->last_picture.f.data[0];
449 render->info.mpeg4.forward_reference = last->surface;
/* Queue the picture's bitstream data on the current render state. */
452 ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size);
454 ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
/* Only the used count is reset here; the descriptor array itself is not
 * freed in this function. */
455 render->bitstream_buffers_used = 0;
457 #endif /* CONFIG_MPEG4_VDPAU_DECODER */
/**
 * Map the codec id and profile of a codec context to a VDPAU decoder
 * profile.
 *
 * @param avctx   codec context; codec_id and profile are inspected
 * @param profile destination for the matching VdpDecoderProfile
 * @return AVERROR(EINVAL) when the codec id is not handled or its profile
 *         has no mapping; see the note on PROFILE for the other paths
 */
459 int av_vdpau_get_profile(AVCodecContext *avctx, VdpDecoderProfile *profile)
/* NOTE(review): the body of PROFILE is not visible in this listing. The case
 * labels that use it are not followed by a break, so it presumably stores
 * prof through profile and returns from the function -- confirm against the
 * complete source. */
461 #define PROFILE(prof) \
467 switch (avctx->codec_id) {
468 case AV_CODEC_ID_MPEG1VIDEO: PROFILE(VDP_DECODER_PROFILE_MPEG1);
469 case AV_CODEC_ID_MPEG2VIDEO:
470 switch (avctx->profile) {
471 case FF_PROFILE_MPEG2_MAIN: PROFILE(VDP_DECODER_PROFILE_MPEG2_MAIN);
472 case FF_PROFILE_MPEG2_SIMPLE: PROFILE(VDP_DECODER_PROFILE_MPEG2_SIMPLE);
473 default: return AVERROR(EINVAL);
/* H.263 is mapped to the MPEG-4 Part 2 ASP decoder profile regardless of
 * avctx->profile. */
475 case AV_CODEC_ID_H263: PROFILE(VDP_DECODER_PROFILE_MPEG4_PART2_ASP);
476 case AV_CODEC_ID_MPEG4:
477 switch (avctx->profile) {
478 case FF_PROFILE_MPEG4_SIMPLE: PROFILE(VDP_DECODER_PROFILE_MPEG4_PART2_SP);
479 case FF_PROFILE_MPEG4_ADVANCED_SIMPLE: PROFILE(VDP_DECODER_PROFILE_MPEG4_PART2_ASP);
480 default: return AVERROR(EINVAL);
482 case AV_CODEC_ID_H264:
483 switch (avctx->profile) {
/* Constrained baseline shares the baseline decoder profile. */
484 case FF_PROFILE_H264_CONSTRAINED_BASELINE:
485 case FF_PROFILE_H264_BASELINE: PROFILE(VDP_DECODER_PROFILE_H264_BASELINE);
486 case FF_PROFILE_H264_MAIN: PROFILE(VDP_DECODER_PROFILE_H264_MAIN);
487 case FF_PROFILE_H264_HIGH: PROFILE(VDP_DECODER_PROFILE_H264_HIGH);
488 default: return AVERROR(EINVAL);
/* WMV3 and VC-1 share one profile table. */
490 case AV_CODEC_ID_WMV3:
491 case AV_CODEC_ID_VC1:
492 switch (avctx->profile) {
493 case FF_PROFILE_VC1_SIMPLE: PROFILE(VDP_DECODER_PROFILE_VC1_SIMPLE);
494 case FF_PROFILE_VC1_MAIN: PROFILE(VDP_DECODER_PROFILE_VC1_MAIN);
495 case FF_PROFILE_VC1_ADVANCED: PROFILE(VDP_DECODER_PROFILE_VC1_ADVANCED);
496 default: return AVERROR(EINVAL);
/* Reached for codec ids without a case label above. */
499 return AVERROR(EINVAL);
502 AVVDPAUContext *av_vdpau_alloc_context(void)
504 return av_mallocz(sizeof(AVVDPAUContext));