h264dec: Fix mix of lossless and lossy MBs decoding

[ffmpeg] / libavcodec / hevcdec.c
diff --git a/libavcodec/hevcdec.c b/libavcodec/hevcdec.c

index 147243e3fe52778069c5e7d0b87ad03972c840f1..f6bbb7051e3fa03236c3dc8a5835cb79ffb76a63 100644 (file)
--- a/libavcodec/hevcdec.c
+++ b/libavcodec/hevcdec.c
@@ -35,7 +35,7 @@
  #include "bswapdsp.h"
  #include "bytestream.h"
  #include "cabac_functions.h"
-#include "golomb.h"
+#include "golomb_legacy.h"
  #include "hevc.h"
  #include "hevc_data.h"
  #include "hevcdec.h"
@@ -338,13 +338,14 @@ static void export_stream_params(AVCodecContext *avctx, const HEVCParamSets *ps,
                                   const HEVCSPS *sps)
  {
      const HEVCVPS *vps = (const HEVCVPS*)ps->vps_list[sps->vps_id]->data;
+    const HEVCWindow *ow = &sps->output_window;
      unsigned int num = 0, den = 0;
  
      avctx->pix_fmt             = sps->pix_fmt;
      avctx->coded_width         = sps->width;
      avctx->coded_height        = sps->height;
-    avctx->width               = sps->output_width;
-    avctx->height              = sps->output_height;
+    avctx->width               = sps->width  - ow->left_offset - ow->right_offset;
+    avctx->height              = sps->height - ow->top_offset  - ow->bottom_offset;
      avctx->has_b_frames        = sps->temporal_layer[sps->max_sub_layers - 1].num_reorder_pics;
      avctx->profile             = sps->ptl.general_ptl.profile_idc;
      avctx->level               = sps->ptl.general_ptl.level_idc;
@@ -382,19 +383,24 @@ static void export_stream_params(AVCodecContext *avctx, const HEVCParamSets *ps,
  
  static enum AVPixelFormat get_format(HEVCContext *s, const HEVCSPS *sps)
  {
-    #define HWACCEL_MAX (CONFIG_HEVC_DXVA2_HWACCEL + CONFIG_HEVC_D3D11VA_HWACCEL + CONFIG_HEVC_VDPAU_HWACCEL)
+    #define HWACCEL_MAX (CONFIG_HEVC_DXVA2_HWACCEL + CONFIG_HEVC_D3D11VA_HWACCEL * 2 + \
+                         CONFIG_HEVC_VAAPI_HWACCEL + CONFIG_HEVC_VDPAU_HWACCEL)
      enum AVPixelFormat pix_fmts[HWACCEL_MAX + 2], *fmt = pix_fmts;
  
      if (sps->pix_fmt == AV_PIX_FMT_YUV420P || sps->pix_fmt == AV_PIX_FMT_YUVJ420P ||
          sps->pix_fmt == AV_PIX_FMT_YUV420P10) {
+#if CONFIG_HEVC_D3D11VA_HWACCEL
+        *fmt++ = AV_PIX_FMT_D3D11VA_VLD;
+        *fmt++ = AV_PIX_FMT_D3D11;
+#endif
  #if CONFIG_HEVC_DXVA2_HWACCEL
          *fmt++ = AV_PIX_FMT_DXVA2_VLD;
+#endif
+#if CONFIG_HEVC_VAAPI_HWACCEL
+        *fmt++ = AV_PIX_FMT_VAAPI;
  #endif
      }
      if (sps->pix_fmt == AV_PIX_FMT_YUV420P || sps->pix_fmt == AV_PIX_FMT_YUVJ420P) {
-#if CONFIG_HEVC_D3D11VA_HWACCEL
-        *fmt++ = AV_PIX_FMT_D3D11VA_VLD;
-#endif
  #if CONFIG_HEVC_VDPAU_HWACCEL
          *fmt++ = AV_PIX_FMT_VDPAU;
  #endif
@@ -912,8 +918,8 @@ static void hls_residual_coding(HEVCContext *s, int x0, int y0,
      int vshift       = s->ps.sps->vshift[c_idx];
      uint8_t *dst     = &s->frame->data[c_idx][(y0 >> vshift) * stride +
                                                ((x0 >> hshift) << s->ps.sps->pixel_shift)];
-    DECLARE_ALIGNED(32, int16_t, coeffs[MAX_TB_SIZE * MAX_TB_SIZE]) = { 0 };
-    DECLARE_ALIGNED(8, uint8_t, significant_coeff_group_flag[8][8]) = { { 0 } };
+    LOCAL_ALIGNED_32(int16_t, coeffs, [MAX_TB_SIZE * MAX_TB_SIZE]);
+    LOCAL_ALIGNED_8(uint8_t, significant_coeff_group_flag, [8], [8]);
  
      int trafo_size = 1 << log2_trafo_size;
      int i, qp, shift, add, scale, scale_m;
@@ -921,6 +927,8 @@ static void hls_residual_coding(HEVCContext *s, int x0, int y0,
      const uint8_t *scale_matrix;
      uint8_t dc_scale;
  
+    memset(coeffs, 0, sizeof(int16_t) * MAX_TB_SIZE * MAX_TB_SIZE);
+    memset(significant_coeff_group_flag, 0, sizeof(uint8_t) * 8 * 8);
      // Derive QP for dequant
      if (!lc->cu.cu_transquant_bypass_flag) {
          static const int qp_c[] = {
@@ -1750,8 +1758,8 @@ static void hls_prediction_unit(HEVCContext *s, int x0, int y0,
      }
  
      if (current_mv.pred_flag[0] && !current_mv.pred_flag[1]) {
-        DECLARE_ALIGNED(16, int16_t,  tmp[MAX_PB_SIZE * MAX_PB_SIZE]);
-        DECLARE_ALIGNED(16, int16_t, tmp2[MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t,  tmp, [MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp2, [MAX_PB_SIZE * MAX_PB_SIZE]);
  
          luma_mc(s, tmp, tmpstride, ref0->frame,
                  &current_mv.mv[0], x0, y0, nPbW, nPbH, pred_idx);
@@ -1784,8 +1792,8 @@ static void hls_prediction_unit(HEVCContext *s, int x0, int y0,
              s->hevcdsp.put_unweighted_pred_chroma[pred_idx](dst2, s->frame->linesize[2], tmp2, tmpstride, nPbH / 2);
          }
      } else if (!current_mv.pred_flag[0] && current_mv.pred_flag[1]) {
-        DECLARE_ALIGNED(16, int16_t, tmp [MAX_PB_SIZE * MAX_PB_SIZE]);
-        DECLARE_ALIGNED(16, int16_t, tmp2[MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp,  [MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp2, [MAX_PB_SIZE * MAX_PB_SIZE]);
  
          luma_mc(s, tmp, tmpstride, ref1->frame,
                  &current_mv.mv[1], x0, y0, nPbW, nPbH, pred_idx);
@@ -1817,10 +1825,10 @@ static void hls_prediction_unit(HEVCContext *s, int x0, int y0,
              s->hevcdsp.put_unweighted_pred_chroma[pred_idx](dst2, s->frame->linesize[2], tmp2, tmpstride, nPbH / 2);
          }
      } else if (current_mv.pred_flag[0] && current_mv.pred_flag[1]) {
-        DECLARE_ALIGNED(16, int16_t, tmp [MAX_PB_SIZE * MAX_PB_SIZE]);
-        DECLARE_ALIGNED(16, int16_t, tmp2[MAX_PB_SIZE * MAX_PB_SIZE]);
-        DECLARE_ALIGNED(16, int16_t, tmp3[MAX_PB_SIZE * MAX_PB_SIZE]);
-        DECLARE_ALIGNED(16, int16_t, tmp4[MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp,  [MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp2, [MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp3, [MAX_PB_SIZE * MAX_PB_SIZE]);
+        LOCAL_ALIGNED_16(int16_t, tmp4, [MAX_PB_SIZE * MAX_PB_SIZE]);
  
          luma_mc(s, tmp, tmpstride, ref0->frame,
                  &current_mv.mv[0], x0, y0, nPbW, nPbH, pred_idx);
@@ -2355,18 +2363,18 @@ static int set_side_data(HEVCContext *s)
  {
      AVFrame *out = s->ref->frame;
  
-    if (s->sei_frame_packing_present &&
-        s->frame_packing_arrangement_type >= 3 &&
-        s->frame_packing_arrangement_type <= 5 &&
-        s->content_interpretation_type > 0 &&
-        s->content_interpretation_type < 3) {
+    if (s->sei.frame_packing.present &&
+        s->sei.frame_packing.arrangement_type >= 3 &&
+        s->sei.frame_packing.arrangement_type <= 5 &&
+        s->sei.frame_packing.content_interpretation_type > 0 &&
+        s->sei.frame_packing.content_interpretation_type < 3) {
          AVStereo3D *stereo = av_stereo3d_create_side_data(out);
          if (!stereo)
              return AVERROR(ENOMEM);
  
-        switch (s->frame_packing_arrangement_type) {
+        switch (s->sei.frame_packing.arrangement_type) {
          case 3:
-            if (s->quincunx_subsampling)
+            if (s->sei.frame_packing.quincunx_subsampling)
                  stereo->type = AV_STEREO3D_SIDEBYSIDE_QUINCUNX;
              else
                  stereo->type = AV_STEREO3D_SIDEBYSIDE;
@@ -2379,13 +2387,14 @@ static int set_side_data(HEVCContext *s)
              break;
          }
  
-        if (s->content_interpretation_type == 2)
+        if (s->sei.frame_packing.content_interpretation_type == 2)
              stereo->flags = AV_STEREO3D_FLAG_INVERT;
      }
  
-    if (s->sei_display_orientation_present &&
-        (s->sei_anticlockwise_rotation || s->sei_hflip || s->sei_vflip)) {
-        double angle = s->sei_anticlockwise_rotation * 360 / (double) (1 << 16);
+    if (s->sei.display_orientation.present &&
+        (s->sei.display_orientation.anticlockwise_rotation ||
+         s->sei.display_orientation.hflip || s->sei.display_orientation.vflip)) {
+        double angle = s->sei.display_orientation.anticlockwise_rotation * 360 / (double) (1 << 16);
          AVFrameSideData *rotation = av_frame_new_side_data(out,
                                                             AV_FRAME_DATA_DISPLAYMATRIX,
                                                             sizeof(int32_t) * 9);
@@ -2394,7 +2403,14 @@ static int set_side_data(HEVCContext *s)
  
          av_display_rotation_set((int32_t *)rotation->data, angle);
          av_display_matrix_flip((int32_t *)rotation->data,
-                               s->sei_hflip, s->sei_vflip);
+                               s->sei.display_orientation.hflip,
+                               s->sei.display_orientation.vflip);
+    }
+
+    if (s->sei.alternative_transfer.present &&
+        av_color_transfer_name(s->sei.alternative_transfer.preferred_transfer_characteristics) &&
+        s->sei.alternative_transfer.preferred_transfer_characteristics != AVCOL_TRC_UNSPECIFIED) {
+        s->avctx->color_trc = out->color_trc = s->sei.alternative_transfer.preferred_transfer_characteristics;
      }
  
      return 0;
@@ -2479,7 +2495,8 @@ static int decode_nal_unit(HEVCContext *s, const H2645NAL *nal)
          break;
      case HEVC_NAL_SEI_PREFIX:
      case HEVC_NAL_SEI_SUFFIX:
-        ret = ff_hevc_decode_nal_sei(s);
+        ret = ff_hevc_decode_nal_sei(gb, s->avctx, &s->sei,
+                                     s->nal_unit_type);
          if (ret < 0)
              goto fail;
          break;
@@ -2687,7 +2704,7 @@ static int verify_md5(HEVCContext *s, AVFrame *frame)
          }
          av_md5_final(s->md5_ctx, md5);
  
-        if (!memcmp(md5, s->md5[i], 16)) {
+        if (!memcmp(md5, s->sei.picture_hash.md5[i], 16)) {
              av_log   (s->avctx, AV_LOG_DEBUG, "plane %d - correct ", i);
              print_md5(s->avctx, AV_LOG_DEBUG, md5);
              av_log   (s->avctx, AV_LOG_DEBUG, "; ");
@@ -2695,7 +2712,7 @@ static int verify_md5(HEVCContext *s, AVFrame *frame)
              av_log   (s->avctx, AV_LOG_ERROR, "mismatching checksum of plane %d - ", i);
              print_md5(s->avctx, AV_LOG_ERROR, md5);
              av_log   (s->avctx, AV_LOG_ERROR, " != ");
-            print_md5(s->avctx, AV_LOG_ERROR, s->md5[i]);
+            print_md5(s->avctx, AV_LOG_ERROR, s->sei.picture_hash.md5[i]);
              av_log   (s->avctx, AV_LOG_ERROR, "\n");
              return AVERROR_INVALIDDATA;
          }
@@ -2815,7 +2832,7 @@ static int hevc_decode_frame(AVCodecContext *avctx, void *data, int *got_output,
      } else {
          /* verify the SEI checksum */
          if (avctx->err_recognition & AV_EF_CRCCHECK && s->is_decoded &&
-            s->is_md5) {
+            s->sei.picture_hash.is_md5) {
              ret = verify_md5(s, s->ref->frame);
              if (ret < 0 && avctx->err_recognition & AV_EF_EXPLODE) {
                  ff_hevc_unref_frame(s, s->ref, ~0);
@@ -2823,7 +2840,7 @@ static int hevc_decode_frame(AVCodecContext *avctx, void *data, int *got_output,
              }
          }
      }
-    s->is_md5 = 0;
+    s->sei.picture_hash.is_md5 = 0;
  
      if (s->is_decoded) {
          av_log(avctx, AV_LOG_DEBUG, "Decoded frame with POC %d.\n", s->poc);
@@ -2860,7 +2877,6 @@ static int hevc_ref_frame(HEVCContext *s, HEVCFrame *dst, HEVCFrame *src)
  
      dst->poc        = src->poc;
      dst->ctb_count  = src->ctb_count;
-    dst->window     = src->window;
      dst->flags      = src->flags;
      dst->sequence   = src->sequence;
  
@@ -3088,4 +3104,5 @@ AVCodec ff_hevc_decoder = {
      .capabilities          = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
                               AV_CODEC_CAP_FRAME_THREADS,
      .profiles              = NULL_IF_CONFIG_SMALL(ff_hevc_profiles),
+    .caps_internal         = FF_CODEC_CAP_EXPORTS_CROPPING | FF_CODEC_CAP_INIT_THREADSAFE,
  };