git.sesse.net Git - ffmpeg/blob - libavcodec/vda_h264.c

   1 /*
   2  * VDA H264 HW acceleration.
   3  *
   4  * copyright (c) 2011 Sebastien Zwickert
   5  *
   6  * This file is part of FFmpeg.
   7  *
   8  * FFmpeg is free software; you can redistribute it and/or
   9  * modify it under the terms of the GNU Lesser General Public
  10  * License as published by the Free Software Foundation; either
  11  * version 2.1 of the License, or (at your option) any later version.
  12  *
  13  * FFmpeg is distributed in the hope that it will be useful,
  14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  16  * Lesser General Public License for more details.
  17  *
  18  * You should have received a copy of the GNU Lesser General Public
  19  * License along with FFmpeg; if not, write to the Free Software
  20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21  */
  22
  23 #include <CoreFoundation/CFDictionary.h>
  24 #include <CoreFoundation/CFNumber.h>
  25 #include <CoreFoundation/CFData.h>
  26
  27 #include "vda.h"
  28 #include "libavutil/avutil.h"
  29 #include "h264.h"
  30
  31 struct vda_buffer {
  32     CVPixelBufferRef cv_buffer;
  33 };
  34 #include "internal.h"
  35 #include "vda_internal.h"
  36
  37 typedef struct VDAContext {
  38     // The current bitstream buffer.
  39     uint8_t             *bitstream;
  40
  41     // The current size of the bitstream.
  42     int                  bitstream_size;
  43
  44     // The reference size used for fast reallocation.
  45     int                  allocated_size;
  46
  47     CVImageBufferRef frame;
  48 } VDAContext;
  49
  50 /* Decoder callback that adds the vda frame to the queue in display order. */
  51 static void vda_decoder_callback(void *vda_hw_ctx,
  52                                  CFDictionaryRef user_info,
  53                                  OSStatus status,
  54                                  uint32_t infoFlags,
  55                                  CVImageBufferRef image_buffer)
  56 {
  57     struct vda_context *vda_ctx = vda_hw_ctx;
  58
  59     if (infoFlags & kVDADecodeInfo_FrameDropped)
  60         vda_ctx->cv_buffer = NULL;
  61
  62     if (!image_buffer)
  63         return;
  64
  65     if (vda_ctx->cv_pix_fmt_type != CVPixelBufferGetPixelFormatType(image_buffer))
  66         return;
  67
  68     vda_ctx->cv_buffer = CVPixelBufferRetain(image_buffer);
  69 }
  70
  71 static int vda_sync_decode(VDAContext *ctx, struct vda_context *vda_ctx)
  72 {
  73     OSStatus status;
  74     CFDataRef coded_frame;
  75     uint32_t flush_flags = 1 << 0; ///< kVDADecoderFlush_emitFrames
  76
  77     coded_frame = CFDataCreate(kCFAllocatorDefault,
  78                                ctx->bitstream,
  79                                ctx->bitstream_size);
  80
  81     status = VDADecoderDecode(vda_ctx->decoder, 0, coded_frame, NULL);
  82
  83     if (kVDADecoderNoErr == status)
  84         status = VDADecoderFlush(vda_ctx->decoder, flush_flags);
  85
  86     CFRelease(coded_frame);
  87
  88     return status;
  89 }
  90
  91
  92 static int vda_old_h264_start_frame(AVCodecContext *avctx,
  93                                 av_unused const uint8_t *buffer,
  94                                 av_unused uint32_t size)
  95 {
  96     VDAContext *vda = avctx->internal->hwaccel_priv_data;
  97     struct vda_context *vda_ctx = avctx->hwaccel_context;
  98
  99     if (!vda_ctx->decoder)
 100         return -1;
 101
 102     vda->bitstream_size = 0;
 103
 104     return 0;
 105 }
 106
 107 static int vda_old_h264_decode_slice(AVCodecContext *avctx,
 108                                  const uint8_t *buffer,
 109                                  uint32_t size)
 110 {
 111     VDAContext *vda             = avctx->internal->hwaccel_priv_data;
 112     struct vda_context *vda_ctx = avctx->hwaccel_context;
 113     void *tmp;
 114
 115     if (!vda_ctx->decoder)
 116         return -1;
 117
 118     tmp = av_fast_realloc(vda->bitstream,
 119                           &vda->allocated_size,
 120                           vda->bitstream_size + size + 4);
 121     if (!tmp)
 122         return AVERROR(ENOMEM);
 123
 124     vda->bitstream = tmp;
 125
 126     AV_WB32(vda->bitstream + vda->bitstream_size, size);
 127     memcpy(vda->bitstream + vda->bitstream_size + 4, buffer, size);
 128
 129     vda->bitstream_size += size + 4;
 130
 131     return 0;
 132 }
 133
 134 static void vda_h264_release_buffer(void *opaque, uint8_t *data)
 135 {
 136     struct vda_buffer *context = opaque;
 137     CVPixelBufferRelease(context->cv_buffer);
 138     av_free(context);
 139 }
 140
 141 static int vda_old_h264_end_frame(AVCodecContext *avctx)
 142 {
 143     H264Context *h                      = avctx->priv_data;
 144     VDAContext *vda                     = avctx->internal->hwaccel_priv_data;
 145     struct vda_context *vda_ctx         = avctx->hwaccel_context;
 146     AVFrame *frame                      = h->cur_pic_ptr->f;
 147     struct vda_buffer *context;
 148     AVBufferRef *buffer;
 149     int status;
 150
 151     if (!vda_ctx->decoder || !vda->bitstream)
 152         return -1;
 153
 154     status = vda_sync_decode(vda, vda_ctx);
 155     frame->data[3] = (void*)vda_ctx->cv_buffer;
 156
 157     if (status)
 158         av_log(avctx, AV_LOG_ERROR, "Failed to decode frame (%d)\n", status);
 159
 160     if (!vda_ctx->use_ref_buffer || status)
 161         return status;
 162
 163     context = av_mallocz(sizeof(*context));
 164     buffer = av_buffer_create(NULL, 0, vda_h264_release_buffer, context, 0);
 165     if (!context || !buffer) {
 166         CVPixelBufferRelease(vda_ctx->cv_buffer);
 167         av_free(context);
 168         return -1;
 169     }
 170
 171     context->cv_buffer = vda_ctx->cv_buffer;
 172     frame->buf[3] = buffer;
 173
 174     return status;
 175 }
 176
 177 int ff_vda_create_decoder(struct vda_context *vda_ctx,
 178                           uint8_t *extradata,
 179                           int extradata_size)
 180 {
 181     OSStatus status;
 182     CFNumberRef height;
 183     CFNumberRef width;
 184     CFNumberRef format;
 185     CFDataRef avc_data;
 186     CFMutableDictionaryRef config_info;
 187     CFMutableDictionaryRef buffer_attributes;
 188     CFMutableDictionaryRef io_surface_properties;
 189     CFNumberRef cv_pix_fmt;
 190
 191     vda_ctx->priv_bitstream = NULL;
 192     vda_ctx->priv_allocated_size = 0;
 193
 194     /* Each VCL NAL in the bitstream sent to the decoder
 195      * is preceded by a 4 bytes length header.
 196      * Change the avcC atom header if needed, to signal headers of 4 bytes. */
 197     if (extradata_size >= 4 && (extradata[4] & 0x03) != 0x03) {
 198         uint8_t *rw_extradata;
 199
 200         if (!(rw_extradata = av_malloc(extradata_size)))
 201             return AVERROR(ENOMEM);
 202
 203         memcpy(rw_extradata, extradata, extradata_size);
 204
 205         rw_extradata[4] |= 0x03;
 206
 207         avc_data = CFDataCreate(kCFAllocatorDefault, rw_extradata, extradata_size);
 208
 209         av_freep(&rw_extradata);
 210     } else {
 211         avc_data = CFDataCreate(kCFAllocatorDefault, extradata, extradata_size);
 212     }
 213
 214     config_info = CFDictionaryCreateMutable(kCFAllocatorDefault,
 215                                             4,
 216                                             &kCFTypeDictionaryKeyCallBacks,
 217                                             &kCFTypeDictionaryValueCallBacks);
 218
 219     height   = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->height);
 220     width    = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->width);
 221     format   = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->format);
 222
 223     CFDictionarySetValue(config_info, kVDADecoderConfiguration_Height, height);
 224     CFDictionarySetValue(config_info, kVDADecoderConfiguration_Width, width);
 225     CFDictionarySetValue(config_info, kVDADecoderConfiguration_SourceFormat, format);
 226     CFDictionarySetValue(config_info, kVDADecoderConfiguration_avcCData, avc_data);
 227
 228     buffer_attributes = CFDictionaryCreateMutable(kCFAllocatorDefault,
 229                                                   2,
 230                                                   &kCFTypeDictionaryKeyCallBacks,
 231                                                   &kCFTypeDictionaryValueCallBacks);
 232     io_surface_properties = CFDictionaryCreateMutable(kCFAllocatorDefault,
 233                                                       0,
 234                                                       &kCFTypeDictionaryKeyCallBacks,
 235                                                       &kCFTypeDictionaryValueCallBacks);
 236     cv_pix_fmt  = CFNumberCreate(kCFAllocatorDefault,
 237                                  kCFNumberSInt32Type,
 238                                  &vda_ctx->cv_pix_fmt_type);
 239     CFDictionarySetValue(buffer_attributes,
 240                          kCVPixelBufferPixelFormatTypeKey,
 241                          cv_pix_fmt);
 242     CFDictionarySetValue(buffer_attributes,
 243                          kCVPixelBufferIOSurfacePropertiesKey,
 244                          io_surface_properties);
 245
 246     status = VDADecoderCreate(config_info,
 247                               buffer_attributes,
 248                               (VDADecoderOutputCallback *)vda_decoder_callback,
 249                               vda_ctx,
 250                               &vda_ctx->decoder);
 251
 252     CFRelease(height);
 253     CFRelease(width);
 254     CFRelease(format);
 255     CFRelease(avc_data);
 256     CFRelease(config_info);
 257     CFRelease(io_surface_properties);
 258     CFRelease(cv_pix_fmt);
 259     CFRelease(buffer_attributes);
 260
 261     return status;
 262 }
 263
 264 int ff_vda_destroy_decoder(struct vda_context *vda_ctx)
 265 {
 266     OSStatus status = kVDADecoderNoErr;
 267
 268     if (vda_ctx->decoder)
 269         status = VDADecoderDestroy(vda_ctx->decoder);
 270
 271     return status;
 272 }
 273
 274 static int vda_h264_uninit(AVCodecContext *avctx)
 275 {
 276     VDAContext *vda = avctx->internal->hwaccel_priv_data;
 277     if (vda) {
 278         av_freep(&vda->bitstream);
 279         if (vda->frame)
 280             CVPixelBufferRelease(vda->frame);
 281     }
 282     return 0;
 283 }
 284
 285 AVHWAccel ff_h264_vda_old_hwaccel = {
 286     .name           = "h264_vda",
 287     .type           = AVMEDIA_TYPE_VIDEO,
 288     .id             = AV_CODEC_ID_H264,
 289     .pix_fmt        = AV_PIX_FMT_VDA_VLD,
 290     .start_frame    = vda_old_h264_start_frame,
 291     .decode_slice   = vda_old_h264_decode_slice,
 292     .end_frame      = vda_old_h264_end_frame,
 293     .uninit         = vda_h264_uninit,
 294     .priv_data_size = sizeof(VDAContext),
 295 };
 296
 297 void ff_vda_output_callback(void *opaque,
 298                             CFDictionaryRef user_info,
 299                             OSStatus status,
 300                             uint32_t infoFlags,
 301                             CVImageBufferRef image_buffer)
 302 {
 303     AVCodecContext *ctx = opaque;
 304     VDAContext *vda = ctx->internal->hwaccel_priv_data;
 305
 306
 307     if (vda->frame) {
 308         CVPixelBufferRelease(vda->frame);
 309         vda->frame = NULL;
 310     }
 311
 312     if (!image_buffer)
 313         return;
 314
 315     vda->frame = CVPixelBufferRetain(image_buffer);
 316 }
 317
 318 static int vda_h264_start_frame(AVCodecContext *avctx,
 319                                 const uint8_t *buffer,
 320                                 uint32_t size)
 321 {
 322     VDAContext *vda = avctx->internal->hwaccel_priv_data;
 323     H264Context *h  = avctx->priv_data;
 324
 325     if (h->is_avc == 1) {
 326         void *tmp;
 327         vda->bitstream_size = 0;
 328         tmp = av_fast_realloc(vda->bitstream,
 329                               &vda->allocated_size,
 330                               size);
 331         vda->bitstream = tmp;
 332         memcpy(vda->bitstream, buffer, size);
 333         vda->bitstream_size = size;
 334     } else {
 335         vda->bitstream_size = 0;
 336     }
 337     return 0;
 338 }
 339
 340 static int vda_h264_decode_slice(AVCodecContext *avctx,
 341                                  const uint8_t *buffer,
 342                                  uint32_t size)
 343 {
 344     VDAContext *vda       = avctx->internal->hwaccel_priv_data;
 345     H264Context *h  = avctx->priv_data;
 346     void *tmp;
 347
 348     if (h->is_avc == 1)
 349         return 0;
 350
 351     tmp = av_fast_realloc(vda->bitstream,
 352                           &vda->allocated_size,
 353                           vda->bitstream_size + size + 4);
 354     if (!tmp)
 355         return AVERROR(ENOMEM);
 356
 357     vda->bitstream = tmp;
 358
 359     AV_WB32(vda->bitstream + vda->bitstream_size, size);
 360     memcpy(vda->bitstream + vda->bitstream_size + 4, buffer, size);
 361
 362     vda->bitstream_size += size + 4;
 363
 364     return 0;
 365 }
 366
 367 static void release_buffer(void *opaque, uint8_t *data)
 368 {
 369     CVImageBufferRef frame = (CVImageBufferRef)data;
 370     CVPixelBufferRelease(frame);
 371 }
 372
 373 static int vda_h264_end_frame(AVCodecContext *avctx)
 374 {
 375     H264Context *h        = avctx->priv_data;
 376     VDAContext *vda       = avctx->internal->hwaccel_priv_data;
 377     AVVDAContext *vda_ctx = avctx->hwaccel_context;
 378     AVFrame *frame        = h->cur_pic_ptr->f;
 379     uint32_t flush_flags  = 1 << 0; ///< kVDADecoderFlush_emitFrames
 380     CFDataRef coded_frame;
 381     OSStatus status;
 382
 383     if (!vda->bitstream_size)
 384         return AVERROR_INVALIDDATA;
 385
 386
 387     coded_frame = CFDataCreate(kCFAllocatorDefault,
 388                                vda->bitstream,
 389                                vda->bitstream_size);
 390
 391     status = VDADecoderDecode(vda_ctx->decoder, 0, coded_frame, NULL);
 392
 393     if (status == kVDADecoderNoErr)
 394         status = VDADecoderFlush(vda_ctx->decoder, flush_flags);
 395
 396     CFRelease(coded_frame);
 397
 398     if (!vda->frame)
 399         return AVERROR_UNKNOWN;
 400
 401     if (status != kVDADecoderNoErr) {
 402         av_log(avctx, AV_LOG_ERROR, "Failed to decode frame (%d)\n", status);
 403         return AVERROR_UNKNOWN;
 404     }
 405
 406     av_buffer_unref(&frame->buf[0]);
 407
 408     frame->buf[0] = av_buffer_create((uint8_t*)vda->frame,
 409                                      sizeof(vda->frame),
 410                                      release_buffer, NULL,
 411                                      AV_BUFFER_FLAG_READONLY);
 412     if (!frame->buf[0])
 413         return AVERROR(ENOMEM);
 414
 415     frame->data[3] = (uint8_t*)vda->frame;
 416     vda->frame = NULL;
 417
 418     return 0;
 419 }
 420
 421 int ff_vda_default_init(AVCodecContext *avctx)
 422 {
 423     AVVDAContext *vda_ctx = avctx->hwaccel_context;
 424     OSStatus status = kVDADecoderNoErr;
 425     CFNumberRef height;
 426     CFNumberRef width;
 427     CFNumberRef format;
 428     CFDataRef avc_data;
 429     CFMutableDictionaryRef config_info;
 430     CFMutableDictionaryRef buffer_attributes;
 431     CFMutableDictionaryRef io_surface_properties;
 432     CFNumberRef cv_pix_fmt;
 433     int32_t fmt = 'avc1', pix_fmt = vda_ctx->cv_pix_fmt_type;
 434
 435     // kCVPixelFormatType_420YpCbCr8Planar;
 436
 437     /* Each VCL NAL in the bitstream sent to the decoder
 438      * is preceded by a 4 bytes length header.
 439      * Change the avcC atom header if needed, to signal headers of 4 bytes. */
 440     if (avctx->extradata_size >= 4 && (avctx->extradata[4] & 0x03) != 0x03) {
 441         uint8_t *rw_extradata;
 442
 443         if (!(rw_extradata = av_malloc(avctx->extradata_size)))
 444             return AVERROR(ENOMEM);
 445
 446         memcpy(rw_extradata, avctx->extradata, avctx->extradata_size);
 447
 448         rw_extradata[4] |= 0x03;
 449
 450         avc_data = CFDataCreate(kCFAllocatorDefault, rw_extradata, avctx->extradata_size);
 451
 452         av_freep(&rw_extradata);
 453     } else {
 454         avc_data = CFDataCreate(kCFAllocatorDefault,
 455                                 avctx->extradata, avctx->extradata_size);
 456     }
 457
 458     config_info = CFDictionaryCreateMutable(kCFAllocatorDefault,
 459                                             4,
 460                                             &kCFTypeDictionaryKeyCallBacks,
 461                                             &kCFTypeDictionaryValueCallBacks);
 462
 463     height = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &avctx->height);
 464     width  = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &avctx->width);
 465     format = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &fmt);
 466     CFDictionarySetValue(config_info, kVDADecoderConfiguration_Height, height);
 467     CFDictionarySetValue(config_info, kVDADecoderConfiguration_Width, width);
 468     CFDictionarySetValue(config_info, kVDADecoderConfiguration_avcCData, avc_data);
 469     CFDictionarySetValue(config_info, kVDADecoderConfiguration_SourceFormat, format);
 470
 471     buffer_attributes = CFDictionaryCreateMutable(kCFAllocatorDefault,
 472                                                   2,
 473                                                   &kCFTypeDictionaryKeyCallBacks,
 474                                                   &kCFTypeDictionaryValueCallBacks);
 475     io_surface_properties = CFDictionaryCreateMutable(kCFAllocatorDefault,
 476                                                       0,
 477                                                       &kCFTypeDictionaryKeyCallBacks,
 478                                                       &kCFTypeDictionaryValueCallBacks);
 479     cv_pix_fmt      = CFNumberCreate(kCFAllocatorDefault,
 480                                      kCFNumberSInt32Type,
 481                                      &pix_fmt);
 482
 483     CFDictionarySetValue(buffer_attributes,
 484                          kCVPixelBufferPixelFormatTypeKey,
 485                          cv_pix_fmt);
 486     CFDictionarySetValue(buffer_attributes,
 487                          kCVPixelBufferIOSurfacePropertiesKey,
 488                          io_surface_properties);
 489
 490     status = VDADecoderCreate(config_info,
 491                               buffer_attributes,
 492                               (VDADecoderOutputCallback *)ff_vda_output_callback,
 493                               avctx,
 494                               &vda_ctx->decoder);
 495
 496     CFRelease(format);
 497     CFRelease(height);
 498     CFRelease(width);
 499     CFRelease(avc_data);
 500     CFRelease(config_info);
 501     CFRelease(cv_pix_fmt);
 502     CFRelease(io_surface_properties);
 503     CFRelease(buffer_attributes);
 504
 505     if (status != kVDADecoderNoErr) {
 506         av_log(avctx, AV_LOG_ERROR, "Cannot initialize VDA %d\n", status);
 507     }
 508
 509     switch (status) {
 510     case kVDADecoderHardwareNotSupportedErr:
 511     case kVDADecoderFormatNotSupportedErr:
 512         return AVERROR(ENOSYS);
 513     case kVDADecoderConfigurationError:
 514         return AVERROR(EINVAL);
 515     case kVDADecoderDecoderFailedErr:
 516         return AVERROR_INVALIDDATA;
 517     case kVDADecoderNoErr:
 518         return 0;
 519     default:
 520         return AVERROR_UNKNOWN;
 521     }
 522 }
 523
 524 static int vda_h264_alloc_frame(AVCodecContext *avctx, AVFrame *frame)
 525 {
 526     frame->width  = avctx->width;
 527     frame->height = avctx->height;
 528     frame->format = avctx->pix_fmt;
 529     frame->buf[0] = av_buffer_alloc(1);
 530
 531     if (!frame->buf[0])
 532         return AVERROR(ENOMEM);
 533     return 0;
 534 }
 535
 536 AVHWAccel ff_h264_vda_hwaccel = {
 537     .name           = "h264_vda",
 538     .type           = AVMEDIA_TYPE_VIDEO,
 539     .id             = AV_CODEC_ID_H264,
 540     .pix_fmt        = AV_PIX_FMT_VDA,
 541     .alloc_frame    = vda_h264_alloc_frame,
 542     .start_frame    = vda_h264_start_frame,
 543     .decode_slice   = vda_h264_decode_slice,
 544     .end_frame      = vda_h264_end_frame,
 545     .uninit         = vda_h264_uninit,
 546     .priv_data_size = sizeof(VDAContext),
 547 };