2 * This file is part of Libav.
4 * Libav is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * Libav is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with Libav; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 #include "libavutil/avassert.h"
20 #include "libavutil/common.h"
21 #include "libavutil/pixdesc.h"
26 #include "vaapi_decode.h"
/*
 * Create one VA buffer of the given type from `data`/`size` and append its
 * ID to pic->param_buffers.
 *
 * The VA display and context are taken from the VAAPIDecodeContext stored in
 * avctx->internal->hwaccel_priv_data. A vaCreateBuffer() failure is logged
 * at error level; on success the new buffer ID is logged at debug level.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including the remaining parameters (type, data, size are
 * used below), the local declarations and the return statements -- confirm
 * the returned values against the complete file.
 */
29 int ff_vaapi_decode_make_param_buffer(AVCodecContext *avctx,
30 VAAPIDecodePicture *pic,
35 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
/* Adding one more entry must not exceed MAX_PARAM_BUFFERS; abort otherwise. */
39 av_assert0(pic->nb_param_buffers + 1 <= MAX_PARAM_BUFFERS);
/* A single element of `size` bytes, initialised from `data`. */
41 vas = vaCreateBuffer(ctx->hwctx->display, ctx->va_context,
42 type, size, 1, (void*)data, &buffer);
43 if (vas != VA_STATUS_SUCCESS) {
44 av_log(avctx, AV_LOG_ERROR, "Failed to create parameter "
45 "buffer (type %d): %d (%s).\n",
46 type, vas, vaErrorStr(vas));
/* Record the new buffer ID and advance the count in one step. */
50 pic->param_buffers[pic->nb_param_buffers++] = buffer;
52 av_log(avctx, AV_LOG_DEBUG, "Param buffer (type %d, %zu bytes) "
53 "is %#x.\n", type, size, buffer);
/*
 * Create the two VA buffers belonging to one slice and store their IDs in
 * pic->slice_buffers:
 *   - slice_buffers[2 * nb_slices]     : VASliceParameterBufferType buffer
 *                                        built from params_data/params_size
 *   - slice_buffers[2 * nb_slices + 1] : VASliceDataBufferType buffer built
 *                                        from slice_data/slice_size
 *
 * The slice_buffers array grows on demand: 64 slices on first use, then
 * doubling. AVERROR(ENOMEM) is returned when slice_buffers is NULL after the
 * resize. If creating the data buffer fails, the parameter buffer created
 * just before it is destroyed again.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including two size parameters, the local declarations, the
 * other return statements and presumably the final nb_slices increment --
 * confirm against the complete file.
 */
58 int ff_vaapi_decode_make_slice_buffer(AVCodecContext *avctx,
59 VAAPIDecodePicture *pic,
60 const void *params_data,
62 const void *slice_data,
65 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
69 av_assert0(pic->nb_slices <= pic->slices_allocated);
/* Array is full (or not yet allocated): enlarge it before adding a slice. */
70 if (pic->nb_slices == pic->slices_allocated) {
71 if (pic->slices_allocated > 0)
72 pic->slices_allocated *= 2;
74 pic->slices_allocated = 64;
/*
 * Two buffer IDs are stored per slice, hence the doubled element size.
 * NOTE(review): the assignment line is not visible here; if the result is
 * written straight back to pic->slice_buffers, the previous array would be
 * leaked on failure while slices_allocated has already been enlarged --
 * consider a temporary pointer.
 */
77 av_realloc_array(pic->slice_buffers,
78 pic->slices_allocated,
79 2 * sizeof(*pic->slice_buffers));
80 if (!pic->slice_buffers)
81 return AVERROR(ENOMEM);
83 av_assert0(pic->nb_slices + 1 <= pic->slices_allocated);
/* Even index: slice parameters; odd index (index + 1): slice data. */
85 index = 2 * pic->nb_slices;
87 vas = vaCreateBuffer(ctx->hwctx->display, ctx->va_context,
88 VASliceParameterBufferType,
89 params_size, 1, (void*)params_data,
90 &pic->slice_buffers[index]);
91 if (vas != VA_STATUS_SUCCESS) {
92 av_log(avctx, AV_LOG_ERROR, "Failed to create slice "
93 "parameter buffer: %d (%s).\n", vas, vaErrorStr(vas));
97 av_log(avctx, AV_LOG_DEBUG, "Slice %d param buffer (%zu bytes) "
98 "is %#x.\n", pic->nb_slices, params_size,
99 pic->slice_buffers[index]);
101 vas = vaCreateBuffer(ctx->hwctx->display, ctx->va_context,
102 VASliceDataBufferType,
103 slice_size, 1, (void*)slice_data,
104 &pic->slice_buffers[index + 1]);
105 if (vas != VA_STATUS_SUCCESS) {
106 av_log(avctx, AV_LOG_ERROR, "Failed to create slice "
107 "data buffer (size %zu): %d (%s).\n",
108 slice_size, vas, vaErrorStr(vas));
/* Do not leave the parameter buffer created above behind. */
109 vaDestroyBuffer(ctx->hwctx->display,
110 pic->slice_buffers[index]);
114 av_log(avctx, AV_LOG_DEBUG, "Slice %d data buffer (%zu bytes) "
115 "is %#x.\n", pic->nb_slices, slice_size,
116 pic->slice_buffers[index + 1]);
/*
 * Destroy every VA buffer currently recorded in pic: first the
 * nb_param_buffers entries of pic->param_buffers, then the 2 * nb_slices
 * entries of pic->slice_buffers (two buffer IDs are stored per slice).
 *
 * A failing vaDestroyBuffer() is only logged at error level; the loops keep
 * going so the remaining buffers are still released. The counters and arrays
 * in pic are not modified here.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), e.g. the local declarations and closing braces.
 */
122 static void ff_vaapi_decode_destroy_buffers(AVCodecContext *avctx,
123 VAAPIDecodePicture *pic)
125 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
129 for (i = 0; i < pic->nb_param_buffers; i++) {
130 vas = vaDestroyBuffer(ctx->hwctx->display,
131 pic->param_buffers[i]);
132 if (vas != VA_STATUS_SUCCESS) {
133 av_log(avctx, AV_LOG_ERROR, "Failed to destroy "
134 "parameter buffer %#x: %d (%s).\n",
135 pic->param_buffers[i], vas, vaErrorStr(vas));
/* Slice buffers are stored as (parameter, data) pairs, hence 2 * nb_slices. */
139 for (i = 0; i < 2 * pic->nb_slices; i++) {
140 vas = vaDestroyBuffer(ctx->hwctx->display,
141 pic->slice_buffers[i]);
142 if (vas != VA_STATUS_SUCCESS) {
/* The two literals concatenate to "Failed to destroy slice buffer ...". */
143 av_log(avctx, AV_LOG_ERROR, "Failed to destroy "
144 "slice buffer %#x: %d (%s).\n",
145 pic->slice_buffers[i], vas, vaErrorStr(vas));
/*
 * Submit the buffers accumulated in pic to the hardware, decoding into
 * pic->output_surface. The visible sequence is:
 *   1. vaBeginPicture() on the output surface,
 *   2. vaRenderPicture() with the parameter buffers,
 *   3. vaRenderPicture() with the slice buffers (two IDs per slice),
 *   4. vaEndPicture().
 *
 * A failure in steps 1-3 is logged and jumps to fail_with_picture. After
 * step 4 the buffers are destroyed explicitly when HAVE_VAAPI_1 is set or
 * the driver has AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS, and the
 * per-picture bookkeeping in pic is reset.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including the labels, the err assignments, the statements
 * chosen after a failed vaEndPicture() and the return -- confirm the exact
 * error paths against the complete file.
 */
150 int ff_vaapi_decode_issue(AVCodecContext *avctx,
151 VAAPIDecodePicture *pic)
153 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
157 av_log(avctx, AV_LOG_DEBUG, "Decode to surface %#x.\n",
158 pic->output_surface);
160 vas = vaBeginPicture(ctx->hwctx->display, ctx->va_context,
161 pic->output_surface);
162 if (vas != VA_STATUS_SUCCESS) {
163 av_log(avctx, AV_LOG_ERROR, "Failed to begin picture decode "
164 "issue: %d (%s).\n", vas, vaErrorStr(vas));
166 goto fail_with_picture;
/* Upload all parameter buffers in one call. */
169 vas = vaRenderPicture(ctx->hwctx->display, ctx->va_context,
170 pic->param_buffers, pic->nb_param_buffers);
171 if (vas != VA_STATUS_SUCCESS) {
172 av_log(avctx, AV_LOG_ERROR, "Failed to upload decode "
173 "parameters: %d (%s).\n", vas, vaErrorStr(vas));
175 goto fail_with_picture;
/* Upload all slice buffers: a (parameter, data) pair per slice. */
178 vas = vaRenderPicture(ctx->hwctx->display, ctx->va_context,
179 pic->slice_buffers, 2 * pic->nb_slices);
180 if (vas != VA_STATUS_SUCCESS) {
181 av_log(avctx, AV_LOG_ERROR, "Failed to upload slices: "
182 "%d (%s).\n", vas, vaErrorStr(vas));
184 goto fail_with_picture;
187 vas = vaEndPicture(ctx->hwctx->display, ctx->va_context);
188 if (vas != VA_STATUS_SUCCESS) {
189 av_log(avctx, AV_LOG_ERROR, "Failed to end picture decode "
190 "issue: %d (%s).\n", vas, vaErrorStr(vas));
/* NOTE(review): the statements selected by this condition are not visible. */
192 if (HAVE_VAAPI_1 || ctx->hwctx->driver_quirks &
193 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS)
/*
 * Explicit cleanup is only done for VAAPI 1 or drivers with the quirk;
 * presumably other drivers release rendered buffers themselves -- confirm
 * against the quirk's documentation.
 */
199 if (HAVE_VAAPI_1 || ctx->hwctx->driver_quirks &
200 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS)
201 ff_vaapi_decode_destroy_buffers(avctx, pic);
/* Reset the per-picture bookkeeping and release the slice ID array. */
203 pic->nb_param_buffers = 0;
205 pic->slices_allocated = 0;
206 av_freep(&pic->slice_buffers);
/* Error handling: close the picture that was begun, then drop the buffers. */
211 vas = vaEndPicture(ctx->hwctx->display, ctx->va_context);
212 if (vas != VA_STATUS_SUCCESS) {
213 av_log(avctx, AV_LOG_ERROR, "Failed to end picture decode "
214 "after error: %d (%s).\n", vas, vaErrorStr(vas));
217 ff_vaapi_decode_destroy_buffers(avctx, pic);
/*
 * Abandon a picture without issuing it: destroy all VA buffers recorded in
 * pic, then reset the bookkeeping (nb_param_buffers, slices_allocated) and
 * free the slice_buffers array.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), presumably including the nb_slices reset and the return
 * statement -- confirm against the complete file.
 */
222 int ff_vaapi_decode_cancel(AVCodecContext *avctx,
223 VAAPIDecodePicture *pic)
/* Must run before the counters are cleared: it iterates over them. */
225 ff_vaapi_decode_destroy_buffers(avctx, pic);
227 pic->nb_param_buffers = 0;
229 pic->slices_allocated = 0;
230 av_freep(&pic->slice_buffers);
/*
 * Table mapping a (codec ID, codec profile) pair to the VAProfile used to
 * decode it. MAP(c, p, v) expands to
 * { AV_CODEC_ID_c, FF_PROFILE_p, VAProfilev }.
 *
 * Entries using UNKNOWN as the profile (H263, VP8) carry FF_PROFILE_UNKNOWN.
 * HEVC, VP8 and VP9 entries are only compiled in when VA_CHECK_VERSION()
 * reports a new enough libva.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including the codec_profile field, the #endif lines closing
 * each version check and the end of the initialiser.
 */
235 static const struct {
236 enum AVCodecID codec_id;
238 VAProfile va_profile;
239 } vaapi_profile_map[] = {
240 #define MAP(c, p, v) { AV_CODEC_ID_ ## c, FF_PROFILE_ ## p, VAProfile ## v }
241 MAP(MPEG2VIDEO, MPEG2_SIMPLE, MPEG2Simple ),
242 MAP(MPEG2VIDEO, MPEG2_MAIN, MPEG2Main ),
243 MAP(H263, UNKNOWN, H263Baseline),
244 MAP(MPEG4, MPEG4_SIMPLE, MPEG4Simple ),
245 MAP(MPEG4, MPEG4_ADVANCED_SIMPLE,
246 MPEG4AdvancedSimple),
247 MAP(MPEG4, MPEG4_MAIN, MPEG4Main ),
248 MAP(H264, H264_CONSTRAINED_BASELINE,
249 H264ConstrainedBaseline),
250 MAP(H264, H264_MAIN, H264Main ),
251 MAP(H264, H264_HIGH, H264High ),
252 #if VA_CHECK_VERSION(0, 37, 0)
253 MAP(HEVC, HEVC_MAIN, HEVCMain ),
254 MAP(HEVC, HEVC_MAIN_10, HEVCMain10 ),
/* Both the COMPLEX and ADVANCED codec profiles map to VAProfileVC1Advanced. */
256 MAP(WMV3, VC1_SIMPLE, VC1Simple ),
257 MAP(WMV3, VC1_MAIN, VC1Main ),
258 MAP(WMV3, VC1_COMPLEX, VC1Advanced ),
259 MAP(WMV3, VC1_ADVANCED, VC1Advanced ),
260 MAP(VC1, VC1_SIMPLE, VC1Simple ),
261 MAP(VC1, VC1_MAIN, VC1Main ),
262 MAP(VC1, VC1_COMPLEX, VC1Advanced ),
263 MAP(VC1, VC1_ADVANCED, VC1Advanced ),
264 #if VA_CHECK_VERSION(0, 35, 0)
265 MAP(VP8, UNKNOWN, VP8Version0_3 ),
267 #if VA_CHECK_VERSION(0, 38, 0)
268 MAP(VP9, VP9_0, VP9Profile0 ),
274 * Set *va_config and the frames_ref fields from the current codec parameters
/*
 * Pick a VAProfile for the stream in avctx, create a VA decode configuration
 * for it in *va_config and fill in the frames context in frames_ref.
 *
 * Visible steps:
 *   - query the profiles supported by the display,
 *   - walk vaapi_profile_map for entries matching avctx->codec_id whose
 *     VAProfile the display offers, recording the match and whether the
 *     codec profile matched as well,
 *   - fail with AVERROR(ENOSYS) when nothing matched; for a non-exact match
 *     continue only if AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH is set,
 *     otherwise fail with AVERROR(EINVAL),
 *   - create the config with the VAEntrypointVLD entry point,
 *   - fetch the frame constraints for that config and reject coded sizes
 *     outside them or an empty software format list (AVERROR(EINVAL)),
 *   - set format, size, sw_format and initial_pool_size on the frames
 *     context.
 * On the failure path *va_config is destroyed (when valid) and reset to
 * VA_INVALID_ID; profile_list and the constraints are freed.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including several conditions, break/continue/goto
 * statements, labels and returns -- confirm control flow against the
 * complete file.
 */
277 static int vaapi_decode_make_config(AVCodecContext *avctx,
278 AVBufferRef *device_ref,
279 VAConfigID *va_config,
280 AVBufferRef *frames_ref)
282 AVVAAPIHWConfig *hwconfig = NULL;
283 AVHWFramesConstraints *constraints = NULL;
286 const AVCodecDescriptor *codec_desc;
287 VAProfile *profile_list = NULL, matched_va_profile;
288 int profile_count, exact_match, matched_ff_profile;
289 const AVPixFmtDescriptor *sw_desc, *desc;
291 AVHWDeviceContext *device = (AVHWDeviceContext*)device_ref->data;
292 AVVAAPIDeviceContext *hwctx = device->hwctx;
294 codec_desc = avcodec_descriptor_get(avctx->codec_id);
296 err = AVERROR(EINVAL);
/* Size the list for the maximum profile count, then query the real list. */
300 profile_count = vaMaxNumProfiles(hwctx->display);
301 profile_list = av_malloc_array(profile_count,
304 err = AVERROR(ENOMEM);
308 vas = vaQueryConfigProfiles(hwctx->display,
309 profile_list, &profile_count);
310 if (vas != VA_STATUS_SUCCESS) {
311 av_log(avctx, AV_LOG_ERROR, "Failed to query profiles: "
312 "%d (%s).\n", vas, vaErrorStr(vas));
313 err = AVERROR(ENOSYS);
317 matched_va_profile = VAProfileNone;
/*
 * Look for a map entry of this codec whose VAProfile the display supports.
 * An entry with FF_PROFILE_UNKNOWN is tested alongside an equal codec
 * profile; exact_match records the outcome for the entry that was found.
 */
320 for (i = 0; i < FF_ARRAY_ELEMS(vaapi_profile_map); i++) {
321 int profile_match = 0;
322 if (avctx->codec_id != vaapi_profile_map[i].codec_id)
324 if (avctx->profile == vaapi_profile_map[i].codec_profile ||
325 vaapi_profile_map[i].codec_profile == FF_PROFILE_UNKNOWN)
327 for (j = 0; j < profile_count; j++) {
328 if (vaapi_profile_map[i].va_profile == profile_list[j]) {
329 exact_match = profile_match;
/* j < profile_count means the inner search stopped on a supported profile. */
333 if (j < profile_count) {
334 matched_va_profile = vaapi_profile_map[i].va_profile;
335 matched_ff_profile = vaapi_profile_map[i].codec_profile;
340 av_freep(&profile_list);
342 if (matched_va_profile == VAProfileNone) {
343 av_log(avctx, AV_LOG_ERROR, "No support for codec %s "
344 "profile %d.\n", codec_desc->name, avctx->profile);
345 err = AVERROR(ENOSYS);
/* Inexact match: proceed only when the user explicitly allowed it. */
349 if (avctx->hwaccel_flags &
350 AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH) {
351 av_log(avctx, AV_LOG_VERBOSE, "Codec %s profile %d not "
352 "supported for hardware decode.\n",
353 codec_desc->name, avctx->profile);
354 av_log(avctx, AV_LOG_WARNING, "Using possibly-"
355 "incompatible profile %d instead.\n",
358 av_log(avctx, AV_LOG_VERBOSE, "Codec %s profile %d not "
359 "supported for hardware decode.\n",
360 codec_desc->name, avctx->profile);
361 err = AVERROR(EINVAL);
366 vas = vaCreateConfig(hwctx->display, matched_va_profile,
367 VAEntrypointVLD, NULL, 0,
369 if (vas != VA_STATUS_SUCCESS) {
370 av_log(avctx, AV_LOG_ERROR, "Failed to create decode "
371 "configuration: %d (%s).\n", vas, vaErrorStr(vas));
/* Ask the device which frame sizes and formats this config supports. */
376 hwconfig = av_hwdevice_hwconfig_alloc(device_ref);
378 err = AVERROR(ENOMEM);
381 hwconfig->config_id = *va_config;
384 av_hwdevice_get_hwframe_constraints(device_ref, hwconfig);
386 err = AVERROR(ENOMEM);
390 if (avctx->coded_width < constraints->min_width ||
391 avctx->coded_height < constraints->min_height ||
392 avctx->coded_width > constraints->max_width ||
393 avctx->coded_height > constraints->max_height) {
394 av_log(avctx, AV_LOG_ERROR, "Hardware does not support image "
395 "size %dx%d (constraints: width %d-%d height %d-%d).\n",
396 avctx->coded_width, avctx->coded_height,
397 constraints->min_width, constraints->max_width,
398 constraints->min_height, constraints->max_height);
399 err = AVERROR(EINVAL);
402 if (!constraints->valid_sw_formats ||
403 constraints->valid_sw_formats[0] == AV_PIX_FMT_NONE) {
404 av_log(avctx, AV_LOG_ERROR, "Hardware does not offer any "
405 "usable surface formats.\n");
406 err = AVERROR(EINVAL);
411 AVHWFramesContext *frames = (AVHWFramesContext *)frames_ref->data;
413 frames->format = AV_PIX_FMT_VAAPI;
414 frames->width = avctx->coded_width;
415 frames->height = avctx->coded_height;
417 // Find the first format in the list which matches the expected
418 // bit depth and subsampling. If none are found (this can happen
419 // when 10-bit streams are decoded to 8-bit surfaces, for example)
420 // then just take the first format on the list.
421 frames->sw_format = constraints->valid_sw_formats[0];
/*
 * NOTE(review): sw_desc is dereferenced below with no visible NULL check;
 * av_pix_fmt_desc_get() can return NULL for an unknown format -- confirm
 * that avctx->sw_pix_fmt is always valid here.
 */
422 sw_desc = av_pix_fmt_desc_get(avctx->sw_pix_fmt);
423 for (i = 0; constraints->valid_sw_formats[i] != AV_PIX_FMT_NONE; i++) {
424 desc = av_pix_fmt_desc_get(constraints->valid_sw_formats[i]);
425 if (desc->nb_components != sw_desc->nb_components ||
426 desc->log2_chroma_w != sw_desc->log2_chroma_w ||
427 desc->log2_chroma_h != sw_desc->log2_chroma_h)
429 for (j = 0; j < desc->nb_components; j++) {
430 if (desc->comp[j].depth != sw_desc->comp[j].depth)
433 if (j < desc->nb_components)
435 frames->sw_format = constraints->valid_sw_formats[i];
/* Start at one surface, then add the per-codec reference count below. */
439 frames->initial_pool_size = 1;
440 // Add per-codec number of surfaces used for storing reference frames.
441 switch (avctx->codec_id) {
442 case AV_CODEC_ID_H264:
443 case AV_CODEC_ID_HEVC:
444 frames->initial_pool_size += 16;
446 case AV_CODEC_ID_VP9:
447 frames->initial_pool_size += 8;
449 case AV_CODEC_ID_VP8:
450 frames->initial_pool_size += 3;
453 frames->initial_pool_size += 2;
457 av_hwframe_constraints_free(&constraints);
/* Cleanup that undoes the partially built state (presumably the fail path). */
463 av_hwframe_constraints_free(&constraints);
465 if (*va_config != VA_INVALID_ID) {
466 vaDestroyConfig(hwctx->display, *va_config);
467 *va_config = VA_INVALID_ID;
469 av_freep(&profile_list);
/*
 * Fill in the frames context in hw_frames_ctx for the stream in avctx by
 * running vaapi_decode_make_config() with a local, throw-away VA config.
 *
 * AVERROR(EINVAL) is returned when the frames context does not belong to a
 * VAAPI device. The VA config created along the way is destroyed again here
 * if one was produced.
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including the last argument of the make_config call, the
 * error check after it and the final return -- confirm against the complete
 * file.
 */
473 int ff_vaapi_common_frame_params(AVCodecContext *avctx,
474 AVBufferRef *hw_frames_ctx)
476 AVHWFramesContext *hw_frames = (AVHWFramesContext *)hw_frames_ctx->data;
477 AVHWDeviceContext *device_ctx = hw_frames->device_ctx;
478 AVVAAPIDeviceContext *hwctx;
479 VAConfigID va_config = VA_INVALID_ID;
/* Only read the device's hwctx as a VAAPI one after checking the type. */
482 if (device_ctx->type != AV_HWDEVICE_TYPE_VAAPI)
483 return AVERROR(EINVAL);
484 hwctx = device_ctx->hwctx;
486 err = vaapi_decode_make_config(avctx, hw_frames->device_ref, &va_config,
/* The config was only needed to derive the frame parameters. */
491 if (va_config != VA_INVALID_ID)
492 vaDestroyConfig(hwctx->display, va_config);
/*
 * Initialise the VAAPI decode state kept in
 * avctx->internal->hwaccel_priv_data.
 *
 * Both IDs start out as VA_INVALID_ID. Two setups are visible:
 *   - Deprecated path (FF_API_VAAPI_CONTEXT and avctx->hwaccel_context set):
 *     a generic VAAPI device context is allocated only to carry the
 *     user-supplied display, AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS is
 *     set, and the config/context IDs are taken from the user's struct.
 *   - Regular path: a hardware frames context is obtained through
 *     ff_decode_get_hw_frames_ctx(), a config is built with
 *     vaapi_decode_make_config() and a VA context is created over the frame
 *     pool's surfaces.
 * The visible cleanup calls ff_vaapi_decode_uninit().
 *
 * NOTE(review): this listing omits some source lines (the embedded line
 * numbers skip), including else branches, #endif lines, error checks, gotos,
 * labels and returns -- confirm control flow against the complete file.
 */
497 int ff_vaapi_decode_init(AVCodecContext *avctx)
499 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
/* Mark both IDs invalid up front; uninit tests for this value. */
503 ctx->va_config = VA_INVALID_ID;
504 ctx->va_context = VA_INVALID_ID;
506 #if FF_API_VAAPI_CONTEXT
507 if (avctx->hwaccel_context) {
508 av_log(avctx, AV_LOG_WARNING, "Using deprecated struct "
509 "vaapi_context in decode.\n");
511 ctx->have_old_context = 1;
512 ctx->old_context = avctx->hwaccel_context;
514 // Really we only want the VAAPI device context, but this
515 // allocates a whole generic device context because we don't
516 // have any other way to determine how big it should be.
518 av_hwdevice_ctx_alloc(AV_HWDEVICE_TYPE_VAAPI);
519 if (!ctx->device_ref) {
520 err = AVERROR(ENOMEM);
523 ctx->device = (AVHWDeviceContext*)ctx->device_ref->data;
524 ctx->hwctx = ctx->device->hwctx;
/* Reuse the display handle supplied by the user. */
526 ctx->hwctx->display = ctx->old_context->display;
528 // The old VAAPI decode setup assumed this quirk was always
529 // present, so set it here to avoid the behaviour changing.
530 ctx->hwctx->driver_quirks =
531 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS;
536 #if FF_API_VAAPI_CONTEXT
537 if (ctx->have_old_context) {
/* The user already created config and context; just adopt their IDs. */
538 ctx->va_config = ctx->old_context->config_id;
539 ctx->va_context = ctx->old_context->context_id;
541 av_log(avctx, AV_LOG_DEBUG, "Using user-supplied decoder "
542 "context: %#x/%#x.\n", ctx->va_config, ctx->va_context);
546 err = ff_decode_get_hw_frames_ctx(avctx, AV_HWDEVICE_TYPE_VAAPI);
/* Cache the frames and device contexts reached through hw_frames_ctx. */
550 ctx->frames = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
551 ctx->hwfc = ctx->frames->hwctx;
552 ctx->device = ctx->frames->device_ctx;
553 ctx->hwctx = ctx->device->hwctx;
555 err = vaapi_decode_make_config(avctx, ctx->frames->device_ref,
556 &ctx->va_config, avctx->hw_frames_ctx);
/* The context is created over the surfaces of the frame pool. */
560 vas = vaCreateContext(ctx->hwctx->display, ctx->va_config,
561 avctx->coded_width, avctx->coded_height,
563 ctx->hwfc->surface_ids,
564 ctx->hwfc->nb_surfaces,
566 if (vas != VA_STATUS_SUCCESS) {
567 av_log(avctx, AV_LOG_ERROR, "Failed to create decode "
568 "context: %d (%s).\n", vas, vaErrorStr(vas));
573 av_log(avctx, AV_LOG_DEBUG, "Decode context initialised: "
574 "%#x/%#x.\n", ctx->va_config, ctx->va_context);
575 #if FF_API_VAAPI_CONTEXT
/* Tear down whatever was set up so far (presumably the failure path). */
582 ff_vaapi_decode_uninit(avctx);
586 int ff_vaapi_decode_uninit(AVCodecContext *avctx)
588 VAAPIDecodeContext *ctx = avctx->internal->hwaccel_priv_data;
591 #if FF_API_VAAPI_CONTEXT
592 if (ctx->have_old_context) {
593 av_buffer_unref(&ctx->device_ref);
597 if (ctx->va_context != VA_INVALID_ID) {
598 vas = vaDestroyContext(ctx->hwctx->display, ctx->va_context);
599 if (vas != VA_STATUS_SUCCESS) {
600 av_log(avctx, AV_LOG_ERROR, "Failed to destroy decode "
601 "context %#x: %d (%s).\n",
602 ctx->va_context, vas, vaErrorStr(vas));
605 if (ctx->va_config != VA_INVALID_ID) {
606 vas = vaDestroyConfig(ctx->hwctx->display, ctx->va_config);
607 if (vas != VA_STATUS_SUCCESS) {
608 av_log(avctx, AV_LOG_ERROR, "Failed to destroy decode "
609 "configuration %#x: %d (%s).\n",
610 ctx->va_config, vas, vaErrorStr(vas));
614 #if FF_API_VAAPI_CONTEXT