avframe: add AV_FRAME_DATA_MATRIXENCODING side data type.

[ffmpeg] / libavcodec / h264.c
diff --git a/libavcodec/h264.c b/libavcodec/h264.c

index d4f04c62989961fa4f321ef009b1ec225d4dbaee..3aa3af0a64fe48ac0e30ab1bf38191cd59e6902f 100644 (file)
--- a/libavcodec/h264.c
+++ b/libavcodec/h264.c
@@ -27,6 +27,7 @@
  
  #include "libavutil/avassert.h"
  #include "libavutil/imgutils.h"
+#include "libavutil/stereo3d.h"
  #include "internal.h"
  #include "cabac.h"
  #include "cabac_functions.h"
@@ -44,7 +45,6 @@
  #include "svq3.h"
  #include "thread.h"
  
-// #undef NDEBUG
  #include <assert.h>
  
  const uint16_t ff_h264_mb_sizes[4] = { 256, 384, 512, 768 };
@@ -61,6 +61,93 @@ static const uint8_t div6[QP_MAX_NUM + 1] = {
      7, 7, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10,
  };
  
+static const uint8_t field_scan[16] = {
+    0 + 0 * 4, 0 + 1 * 4, 1 + 0 * 4, 0 + 2 * 4,
+    0 + 3 * 4, 1 + 1 * 4, 1 + 2 * 4, 1 + 3 * 4,
+    2 + 0 * 4, 2 + 1 * 4, 2 + 2 * 4, 2 + 3 * 4,
+    3 + 0 * 4, 3 + 1 * 4, 3 + 2 * 4, 3 + 3 * 4,
+};
+
+static const uint8_t field_scan8x8[64] = {
+    0 + 0 * 8, 0 + 1 * 8, 0 + 2 * 8, 1 + 0 * 8,
+    1 + 1 * 8, 0 + 3 * 8, 0 + 4 * 8, 1 + 2 * 8,
+    2 + 0 * 8, 1 + 3 * 8, 0 + 5 * 8, 0 + 6 * 8,
+    0 + 7 * 8, 1 + 4 * 8, 2 + 1 * 8, 3 + 0 * 8,
+    2 + 2 * 8, 1 + 5 * 8, 1 + 6 * 8, 1 + 7 * 8,
+    2 + 3 * 8, 3 + 1 * 8, 4 + 0 * 8, 3 + 2 * 8,
+    2 + 4 * 8, 2 + 5 * 8, 2 + 6 * 8, 2 + 7 * 8,
+    3 + 3 * 8, 4 + 1 * 8, 5 + 0 * 8, 4 + 2 * 8,
+    3 + 4 * 8, 3 + 5 * 8, 3 + 6 * 8, 3 + 7 * 8,
+    4 + 3 * 8, 5 + 1 * 8, 6 + 0 * 8, 5 + 2 * 8,
+    4 + 4 * 8, 4 + 5 * 8, 4 + 6 * 8, 4 + 7 * 8,
+    5 + 3 * 8, 6 + 1 * 8, 6 + 2 * 8, 5 + 4 * 8,
+    5 + 5 * 8, 5 + 6 * 8, 5 + 7 * 8, 6 + 3 * 8,
+    7 + 0 * 8, 7 + 1 * 8, 6 + 4 * 8, 6 + 5 * 8,
+    6 + 6 * 8, 6 + 7 * 8, 7 + 2 * 8, 7 + 3 * 8,
+    7 + 4 * 8, 7 + 5 * 8, 7 + 6 * 8, 7 + 7 * 8,
+};
+
+static const uint8_t field_scan8x8_cavlc[64] = {
+    0 + 0 * 8, 1 + 1 * 8, 2 + 0 * 8, 0 + 7 * 8,
+    2 + 2 * 8, 2 + 3 * 8, 2 + 4 * 8, 3 + 3 * 8,
+    3 + 4 * 8, 4 + 3 * 8, 4 + 4 * 8, 5 + 3 * 8,
+    5 + 5 * 8, 7 + 0 * 8, 6 + 6 * 8, 7 + 4 * 8,
+    0 + 1 * 8, 0 + 3 * 8, 1 + 3 * 8, 1 + 4 * 8,
+    1 + 5 * 8, 3 + 1 * 8, 2 + 5 * 8, 4 + 1 * 8,
+    3 + 5 * 8, 5 + 1 * 8, 4 + 5 * 8, 6 + 1 * 8,
+    5 + 6 * 8, 7 + 1 * 8, 6 + 7 * 8, 7 + 5 * 8,
+    0 + 2 * 8, 0 + 4 * 8, 0 + 5 * 8, 2 + 1 * 8,
+    1 + 6 * 8, 4 + 0 * 8, 2 + 6 * 8, 5 + 0 * 8,
+    3 + 6 * 8, 6 + 0 * 8, 4 + 6 * 8, 6 + 2 * 8,
+    5 + 7 * 8, 6 + 4 * 8, 7 + 2 * 8, 7 + 6 * 8,
+    1 + 0 * 8, 1 + 2 * 8, 0 + 6 * 8, 3 + 0 * 8,
+    1 + 7 * 8, 3 + 2 * 8, 2 + 7 * 8, 4 + 2 * 8,
+    3 + 7 * 8, 5 + 2 * 8, 4 + 7 * 8, 5 + 4 * 8,
+    6 + 3 * 8, 6 + 5 * 8, 7 + 3 * 8, 7 + 7 * 8,
+};
+
+// zigzag_scan8x8_cavlc[i] = zigzag_scan8x8[(i/4) + 16*(i%4)]
+static const uint8_t zigzag_scan8x8_cavlc[64] = {
+    0 + 0 * 8, 1 + 1 * 8, 1 + 2 * 8, 2 + 2 * 8,
+    4 + 1 * 8, 0 + 5 * 8, 3 + 3 * 8, 7 + 0 * 8,
+    3 + 4 * 8, 1 + 7 * 8, 5 + 3 * 8, 6 + 3 * 8,
+    2 + 7 * 8, 6 + 4 * 8, 5 + 6 * 8, 7 + 5 * 8,
+    1 + 0 * 8, 2 + 0 * 8, 0 + 3 * 8, 3 + 1 * 8,
+    3 + 2 * 8, 0 + 6 * 8, 4 + 2 * 8, 6 + 1 * 8,
+    2 + 5 * 8, 2 + 6 * 8, 6 + 2 * 8, 5 + 4 * 8,
+    3 + 7 * 8, 7 + 3 * 8, 4 + 7 * 8, 7 + 6 * 8,
+    0 + 1 * 8, 3 + 0 * 8, 0 + 4 * 8, 4 + 0 * 8,
+    2 + 3 * 8, 1 + 5 * 8, 5 + 1 * 8, 5 + 2 * 8,
+    1 + 6 * 8, 3 + 5 * 8, 7 + 1 * 8, 4 + 5 * 8,
+    4 + 6 * 8, 7 + 4 * 8, 5 + 7 * 8, 6 + 7 * 8,
+    0 + 2 * 8, 2 + 1 * 8, 1 + 3 * 8, 5 + 0 * 8,
+    1 + 4 * 8, 2 + 4 * 8, 6 + 0 * 8, 4 + 3 * 8,
+    0 + 7 * 8, 4 + 4 * 8, 7 + 2 * 8, 3 + 6 * 8,
+    5 + 5 * 8, 6 + 5 * 8, 6 + 6 * 8, 7 + 7 * 8,
+};
+
+static const uint8_t dequant4_coeff_init[6][3] = {
+    { 10, 13, 16 },
+    { 11, 14, 18 },
+    { 13, 16, 20 },
+    { 14, 18, 23 },
+    { 16, 20, 25 },
+    { 18, 23, 29 },
+};
+
+static const uint8_t dequant8_coeff_init_scan[16] = {
+    0, 3, 4, 3, 3, 1, 5, 1, 4, 5, 2, 5, 3, 1, 5, 1
+};
+
+static const uint8_t dequant8_coeff_init[6][6] = {
+    { 20, 18, 32, 19, 25, 24 },
+    { 22, 19, 35, 21, 28, 26 },
+    { 26, 23, 42, 24, 33, 31 },
+    { 28, 25, 45, 26, 35, 33 },
+    { 32, 28, 51, 30, 40, 38 },
+    { 36, 32, 58, 34, 46, 43 },
+};
+
  static const enum AVPixelFormat h264_hwaccel_pixfmt_list_420[] = {
  #if CONFIG_H264_DXVA2_HWACCEL
      AV_PIX_FMT_DXVA2_VLD,
@@ -170,7 +257,7 @@ static void unref_picture(H264Context *h, Picture *pic)
      int off = offsetof(Picture, tf) + sizeof(pic->tf);
      int i;
  
-    if (!pic->f.data[0])
+    if (!pic->f.buf[0])
          return;
  
      ff_thread_release_buffer(h->avctx, &pic->tf);
@@ -192,7 +279,7 @@ static void release_unused_pictures(H264Context *h, int remove_current)
  
      /* release non reference frames */
      for (i = 0; i < MAX_PICTURE_COUNT; i++) {
-        if (h->DPB[i].f.data[0] && !h->DPB[i].reference &&
+        if (h->DPB[i].f.buf[0] && !h->DPB[i].reference &&
              (remove_current || &h->DPB[i] != h->cur_pic_ptr)) {
              unref_picture(h, &h->DPB[i]);
          }
@@ -250,6 +337,7 @@ static int ref_picture(H264Context *h, Picture *dst, Picture *src)
      dst->field_picture = src->field_picture;
      dst->needs_realloc = src->needs_realloc;
      dst->reference     = src->reference;
+    dst->recovered     = src->recovered;
  
      return 0;
  fail:
@@ -367,7 +455,7 @@ fail:
  
  static inline int pic_is_unused(H264Context *h, Picture *pic)
  {
-    if (pic->f.data[0] == NULL)
+    if (!pic->f.buf[0])
          return 1;
      if (pic->needs_realloc && !(pic->reference & DELAYED_PIC_REF))
          return 1;
@@ -789,7 +877,7 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
      const int mx      = h->mv_cache[list][scan8[n]][0] + src_x_offset * 8;
      int my            = h->mv_cache[list][scan8[n]][1] + src_y_offset * 8;
      const int luma_xy = (mx & 3) + ((my & 3) << 2);
-    int offset        = ((mx >> 2) << pixel_shift) + (my >> 2) * h->mb_linesize;
+    ptrdiff_t offset  = ((mx >> 2) << pixel_shift) + (my >> 2) * h->mb_linesize;
      uint8_t *src_y    = pic->f.data[0] + offset;
      uint8_t *src_cb, *src_cr;
      int extra_width  = 0;
@@ -812,7 +900,7 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
          full_my + 16 /*FIXME*/ > pic_height + extra_height) {
          h->vdsp.emulated_edge_mc(h->edge_emu_buffer,
                                   src_y - (2 << pixel_shift) - 2 * h->mb_linesize,
-                                 h->mb_linesize,
+                                 h->mb_linesize, h->mb_linesize,
                                   16 + 5, 16 + 5 /*FIXME*/, full_mx - 2,
                                   full_my - 2, pic_width, pic_height);
          src_y = h->edge_emu_buffer + (2 << pixel_shift) + 2 * h->mb_linesize;
@@ -831,7 +919,7 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
          if (emu) {
              h->vdsp.emulated_edge_mc(h->edge_emu_buffer,
                                       src_cb - (2 << pixel_shift) - 2 * h->mb_linesize,
-                                     h->mb_linesize,
+                                     h->mb_linesize, h->mb_linesize,
                                       16 + 5, 16 + 5 /*FIXME*/,
                                       full_mx - 2, full_my - 2,
                                       pic_width, pic_height);
@@ -845,7 +933,7 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
          if (emu) {
              h->vdsp.emulated_edge_mc(h->edge_emu_buffer,
                                       src_cr - (2 << pixel_shift) - 2 * h->mb_linesize,
-                                     h->mb_linesize,
+                                     h->mb_linesize, h->mb_linesize,
                                       16 + 5, 16 + 5 /*FIXME*/,
                                       full_mx - 2, full_my - 2,
                                       pic_width, pic_height);
@@ -870,7 +958,8 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
               (my >> ysh) * h->mb_uvlinesize;
  
      if (emu) {
-        h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cb, h->mb_uvlinesize,
+        h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cb,
+                                 h->mb_uvlinesize, h->mb_uvlinesize,
                                   9, 8 * chroma_idc + 1, (mx >> 3), (my >> ysh),
                                   pic_width >> 1, pic_height >> (chroma_idc == 1 /* yuv420 */));
          src_cb = h->edge_emu_buffer;
@@ -880,7 +969,8 @@ static av_always_inline void mc_dir_part(H264Context *h, Picture *pic,
                mx & 7, (my << (chroma_idc == 2 /* yuv422 */)) & 7);
  
      if (emu) {
-        h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cr, h->mb_uvlinesize,
+        h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cr,
+                                 h->mb_uvlinesize, h->mb_uvlinesize,
                                   9, 8 * chroma_idc + 1, (mx >> 3), (my >> ysh),
                                   pic_width >> 1, pic_height >> (chroma_idc == 1 /* yuv420 */));
          src_cr = h->edge_emu_buffer;
@@ -1251,8 +1341,8 @@ int ff_h264_alloc_tables(H264Context *h)
          if (!h->DPB)
              return AVERROR(ENOMEM);
          for (i = 0; i < MAX_PICTURE_COUNT; i++)
-            avcodec_get_frame_defaults(&h->DPB[i].f);
-        avcodec_get_frame_defaults(&h->cur_pic.f);
+            av_frame_unref(&h->DPB[i].f);
+        av_frame_unref(&h->cur_pic.f);
      }
  
      return 0;
@@ -1462,6 +1552,8 @@ av_cold int ff_h264_decode_init(AVCodecContext *avctx)
  
      ff_h264_decode_init_vlc();
  
+    ff_init_cabac_states();
+
      h->pixel_shift        = 0;
      h->sps.bit_depth_luma = avctx->bits_per_raw_sample = 8;
  
@@ -1472,6 +1564,8 @@ av_cold int ff_h264_decode_init(AVCodecContext *avctx)
      h->prev_poc_msb = 1 << 16;
      h->x264_build   = -1;
      ff_h264_reset_sei(h);
+    h->recovery_frame = -1;
+    h->frame_recovered = 0;
      if (avctx->codec_id == AV_CODEC_ID_H264) {
          if (avctx->ticks_per_frame == 1)
              h->avctx->time_base.den *= 2;
@@ -1517,19 +1611,24 @@ static void copy_picture_range(Picture **to, Picture **from, int count,
      }
  }
  
-static void copy_parameter_set(void **to, void **from, int count, int size)
+static int copy_parameter_set(void **to, void **from, int count, int size)
  {
      int i;
  
      for (i = 0; i < count; i++) {
-        if (to[i] && !from[i])
+        if (to[i] && !from[i]) {
              av_freep(&to[i]);
-        else if (from[i] && !to[i])
+        } else if (from[i] && !to[i]) {
              to[i] = av_malloc(size);
+            if (!to[i])
+                return AVERROR(ENOMEM);
+        }
  
          if (from[i])
              memcpy(to[i], from[i], size);
      }
+
+    return 0;
  }
  
  static int decode_init_thread_copy(AVCodecContext *avctx)
@@ -1622,7 +1721,7 @@ static int decode_update_thread_context(AVCodecContext *dst,
          h->context_initialized = 0;
  
          memset(&h->cur_pic, 0, sizeof(h->cur_pic));
-        avcodec_get_frame_defaults(&h->cur_pic.f);
+        av_frame_unref(&h->cur_pic.f);
          h->cur_pic.tf.f = &h->cur_pic.f;
  
          h->avctx             = dst;
@@ -1637,7 +1736,11 @@ static int decode_update_thread_context(AVCodecContext *dst,
              av_log(dst, AV_LOG_ERROR, "Could not allocate memory for h264\n");
              return ret;
          }
-        context_init(h);
+        ret = context_init(h);
+        if (ret < 0) {
+            av_log(dst, AV_LOG_ERROR, "context_init() failed.\n");
+            return ret;
+        }
  
          for (i = 0; i < 2; i++) {
              h->rbsp_buffer[i]      = NULL;
@@ -1665,7 +1768,7 @@ static int decode_update_thread_context(AVCodecContext *dst,
  
      for (i = 0; i < MAX_PICTURE_COUNT; i++) {
          unref_picture(h, &h->DPB[i]);
-        if (h1->DPB[i].f.data[0] &&
+        if (h1->DPB[i].f.buf[0] &&
              (ret = ref_picture(h, &h->DPB[i], &h1->DPB[i])) < 0)
              return ret;
      }
@@ -1689,11 +1792,15 @@ static int decode_update_thread_context(AVCodecContext *dst,
      h->is_avc = h1->is_avc;
  
      // SPS/PPS
-    copy_parameter_set((void **)h->sps_buffers, (void **)h1->sps_buffers,
-                       MAX_SPS_COUNT, sizeof(SPS));
+    if ((ret = copy_parameter_set((void **)h->sps_buffers,
+                                  (void **)h1->sps_buffers,
+                                  MAX_SPS_COUNT, sizeof(SPS))) < 0)
+        return ret;
      h->sps = h1->sps;
-    copy_parameter_set((void **)h->pps_buffers, (void **)h1->pps_buffers,
-                       MAX_PPS_COUNT, sizeof(PPS));
+    if ((ret = copy_parameter_set((void **)h->pps_buffers,
+                                  (void **)h1->pps_buffers,
+                                  MAX_PPS_COUNT, sizeof(PPS))) < 0)
+        return ret;
      h->pps = h1->pps;
  
      // Dequantization matrices
@@ -1738,6 +1845,9 @@ static int decode_update_thread_context(AVCodecContext *dst,
      h->prev_frame_num        = h->frame_num;
      h->outputed_poc          = h->next_outputed_poc;
  
+    h->recovery_frame        = h1->recovery_frame;
+    h->frame_recovered       = h1->frame_recovered;
+
      return err;
  }
  
@@ -1767,6 +1877,7 @@ static int h264_frame_start(H264Context *h)
       */
      pic->f.key_frame = 0;
      pic->mmco_reset  = 0;
+    pic->recovered   = 0;
  
      if ((ret = alloc_picture(h, pic)) < 0)
          return ret;
@@ -1919,6 +2030,46 @@ static void decode_postinit(H264Context *h, int setup_finished)
          }
      }
  
+    if (h->sei_frame_packing_present &&
+        h->frame_packing_arrangement_type >= 0 &&
+        h->frame_packing_arrangement_type <= 6 &&
+        h->content_interpretation_type > 0 &&
+        h->content_interpretation_type < 3) {
+        AVStereo3D *stereo = av_stereo3d_create_side_data(&cur->f);
+        if (!stereo)
+            return;
+
+        switch (h->frame_packing_arrangement_type) {
+        case 0:
+            stereo->type = AV_STEREO3D_CHECKERBOARD;
+            break;
+        case 1:
+            stereo->type = AV_STEREO3D_LINES;
+            break;
+        case 2:
+            stereo->type = AV_STEREO3D_COLUMNS;
+            break;
+        case 3:
+            if (h->quincunx_subsampling)
+                stereo->type = AV_STEREO3D_SIDEBYSIDE_QUINCUNX;
+            else
+                stereo->type = AV_STEREO3D_SIDEBYSIDE;
+            break;
+        case 4:
+            stereo->type = AV_STEREO3D_TOPBOTTOM;
+            break;
+        case 5:
+            stereo->type = AV_STEREO3D_FRAMESEQUENCE;
+            break;
+        case 6:
+            stereo->type = AV_STEREO3D_2D;
+            break;
+        }
+
+        if (h->content_interpretation_type == 2)
+            stereo->flags = AV_STEREO3D_FLAG_INVERT;
+    }
+
      // FIXME do something with unavailable reference frames
  
      /* Sort B-frames into display order */
@@ -2038,6 +2189,15 @@ static void decode_postinit(H264Context *h, int setup_finished)
          av_log(h->avctx, AV_LOG_DEBUG, "no picture\n");
      }
  
+    if (h->next_output_pic) {
+        if (h->next_output_pic->recovered) {
+            // We have reached an recovery point and all frames after it in
+            // display order are "recovered".
+            h->frame_recovered |= FRAME_RECOVERED_SEI;
+        }
+        h->next_output_pic->recovered |= !!(h->frame_recovered & FRAME_RECOVERED_SEI);
+    }
+
      if (setup_finished && !h->avctx->hwaccel)
          ff_thread_finish_setup(h->avctx);
  }
@@ -2462,7 +2622,7 @@ void ff_h264_hl_decode_mb(H264Context *h)
          hl_decode_mb_simple_8(h);
  }
  
-static int pred_weight_table(H264Context *h)
+int ff_pred_weight_table(H264Context *h)
  {
      int list, i;
      int luma_def, chroma_def;
@@ -2619,6 +2779,8 @@ static void flush_change(H264Context *h)
      memset(h->default_ref_list[0], 0, sizeof(h->default_ref_list[0]));
      memset(h->default_ref_list[1], 0, sizeof(h->default_ref_list[1]));
      ff_h264_reset_sei(h);
+    h->recovery_frame = -1;
+    h->frame_recovered = 0;
  }
  
  /* forget old pics after a seek */
@@ -2649,6 +2811,9 @@ static void flush_dpb(AVCodecContext *avctx)
      h->parse_context.overread_index    = 0;
      h->parse_context.index             = 0;
      h->parse_context.last_index        = 0;
+
+    free_tables(h, 1);
+    h->context_initialized = 0;
  }
  
  int ff_init_poc(H264Context *h, int pic_field_poc[2], int *pic_poc)
@@ -3025,7 +3190,7 @@ static int h264_slice_header_init(H264Context *h, int reinit)
                    h->sps.num_units_in_tick, den, 1 << 30);
      }
  
-    h->avctx->hwaccel = ff_find_hwaccel(h->avctx->codec->id, h->avctx->pix_fmt);
+    h->avctx->hwaccel = ff_find_hwaccel(h->avctx);
  
      if (reinit)
          free_tables(h, 0);
@@ -3062,6 +3227,8 @@ static int h264_slice_header_init(H264Context *h, int reinit)
          for (i = 1; i < h->slice_context_count; i++) {
              H264Context *c;
              c                    = h->thread_context[i] = av_mallocz(sizeof(H264Context));
+            if (!c)
+                return AVERROR(ENOMEM);
              c->avctx             = h->avctx;
              c->dsp               = h->dsp;
              c->vdsp              = h->vdsp;
@@ -3106,6 +3273,50 @@ static int h264_slice_header_init(H264Context *h, int reinit)
      return 0;
  }
  
+int ff_set_ref_count(H264Context *h)
+{
+    int num_ref_idx_active_override_flag, max_refs;
+
+    // set defaults, might be overridden a few lines later
+    h->ref_count[0] = h->pps.ref_count[0];
+    h->ref_count[1] = h->pps.ref_count[1];
+
+    if (h->slice_type_nos != AV_PICTURE_TYPE_I) {
+        if (h->slice_type_nos == AV_PICTURE_TYPE_B)
+            h->direct_spatial_mv_pred = get_bits1(&h->gb);
+        num_ref_idx_active_override_flag = get_bits1(&h->gb);
+
+        if (num_ref_idx_active_override_flag) {
+            h->ref_count[0] = get_ue_golomb(&h->gb) + 1;
+            if (h->ref_count[0] < 1)
+                return AVERROR_INVALIDDATA;
+            if (h->slice_type_nos == AV_PICTURE_TYPE_B) {
+                h->ref_count[1] = get_ue_golomb(&h->gb) + 1;
+                if (h->ref_count[1] < 1)
+                    return AVERROR_INVALIDDATA;
+            }
+        }
+
+        if (h->slice_type_nos == AV_PICTURE_TYPE_B)
+            h->list_count = 2;
+        else
+            h->list_count = 1;
+    } else {
+        h->list_count   = 0;
+        h->ref_count[0] = h->ref_count[1] = 0;
+    }
+
+    max_refs = h->picture_structure == PICT_FRAME ? 16 : 32;
+
+    if (h->ref_count[0] > max_refs || h->ref_count[1] > max_refs) {
+        av_log(h->avctx, AV_LOG_ERROR, "reference overflow\n");
+        h->ref_count[0] = h->ref_count[1] = 0;
+        return AVERROR_INVALIDDATA;
+    }
+
+    return 0;
+}
+
  /**
   * Decode a slice header.
   * This will also call ff_MPV_common_init() and frame_start() as needed.
@@ -3120,7 +3331,7 @@ static int decode_slice_header(H264Context *h, H264Context *h0)
  {
      unsigned int first_mb_in_slice;
      unsigned int pps_id;
-    int num_ref_idx_active_override_flag, max_refs, ret;
+    int ret;
      unsigned int slice_type, tmp, i, j;
      int default_ref_list_done = 0;
      int last_pic_structure, last_pic_droppable;
@@ -3354,7 +3565,7 @@ static int decode_slice_header(H264Context *h, H264Context *h0)
           * since that can modify s->current_picture_ptr. */
          if (h0->first_field) {
              assert(h0->cur_pic_ptr);
-            assert(h0->cur_pic_ptr->f.data[0]);
+            assert(h0->cur_pic_ptr->f.buf[0]);
              assert(h0->cur_pic_ptr->reference != DELAYED_PIC_REF);
  
              /* figure out if we have a complementary field pair */
@@ -3444,7 +3655,7 @@ static int decode_slice_header(H264Context *h, H264Context *h0)
           * frame, or to allocate a new one. */
          if (h0->first_field) {
              assert(h0->cur_pic_ptr);
-            assert(h0->cur_pic_ptr->f.data[0]);
+            assert(h0->cur_pic_ptr->f.buf[0]);
              assert(h0->cur_pic_ptr->reference != DELAYED_PIC_REF);
  
              /* figure out if we have a complementary field pair */
@@ -3527,42 +3738,9 @@ static int decode_slice_header(H264Context *h, H264Context *h0)
      if (h->pps.redundant_pic_cnt_present)
          h->redundant_pic_count = get_ue_golomb(&h->gb);
  
-    // set defaults, might be overridden a few lines later
-    h->ref_count[0] = h->pps.ref_count[0];
-    h->ref_count[1] = h->pps.ref_count[1];
-
-    if (h->slice_type_nos != AV_PICTURE_TYPE_I) {
-        if (h->slice_type_nos == AV_PICTURE_TYPE_B)
-            h->direct_spatial_mv_pred = get_bits1(&h->gb);
-        num_ref_idx_active_override_flag = get_bits1(&h->gb);
-
-        if (num_ref_idx_active_override_flag) {
-            h->ref_count[0] = get_ue_golomb(&h->gb) + 1;
-            if (h->ref_count[0] < 1)
-                return AVERROR_INVALIDDATA;
-            if (h->slice_type_nos == AV_PICTURE_TYPE_B) {
-                h->ref_count[1] = get_ue_golomb(&h->gb) + 1;
-                if (h->ref_count[1] < 1)
-                    return AVERROR_INVALIDDATA;
-            }
-        }
-
-        if (h->slice_type_nos == AV_PICTURE_TYPE_B)
-            h->list_count = 2;
-        else
-            h->list_count = 1;
-    } else {
-        h->list_count   = 0;
-        h->ref_count[0] = h->ref_count[1] = 0;
-    }
-
-    max_refs = h->picture_structure == PICT_FRAME ? 16 : 32;
-
-    if (h->ref_count[0] > max_refs || h->ref_count[1] > max_refs) {
-        av_log(h->avctx, AV_LOG_ERROR, "reference overflow\n");
-        h->ref_count[0] = h->ref_count[1] = 0;
-        return AVERROR_INVALIDDATA;
-    }
+    ret = ff_set_ref_count(h);
+    if (ret < 0)
+        return ret;
  
      if (!default_ref_list_done)
          ff_h264_fill_default_ref_list(h);
@@ -3578,7 +3756,7 @@ static int decode_slice_header(H264Context *h, H264Context *h0)
      if ((h->pps.weighted_pred && h->slice_type_nos == AV_PICTURE_TYPE_P) ||
          (h->pps.weighted_bipred_idc == 1 &&
           h->slice_type_nos == AV_PICTURE_TYPE_B))
-        pred_weight_table(h);
+        ff_pred_weight_table(h);
      else if (h->pps.weighted_bipred_idc == 2 &&
               h->slice_type_nos == AV_PICTURE_TYPE_B) {
          implicit_weight_table(h, -1);
@@ -4154,7 +4332,6 @@ static int decode_slice(struct AVCodecContext *avctx, void *arg)
          align_get_bits(&h->gb);
  
          /* init cabac */
-        ff_init_cabac_states();
          ff_init_cabac_decoder(&h->cabac,
                                h->gb.buffer + get_bits_count(&h->gb) / 8,
                                (get_bits_left(&h->gb) + 7) / 8);
@@ -4338,8 +4515,6 @@ static int execute_decode_slices(H264Context *h, int context_count)
      return 0;
  }
  
-static const uint8_t start_code[] = { 0x00, 0x00, 0x01 };
-
  static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size,
                              int parse_extradata)
  {
@@ -4420,7 +4595,7 @@ static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size,
                  h->workaround_bugs |= FF_BUG_TRUNCATED;
  
              if (!(h->workaround_bugs & FF_BUG_TRUNCATED))
-                while (ptr[dst_length - 1] == 0 && dst_length > 0)
+                while (dst_length > 0 && ptr[dst_length - 1] == 0)
                      dst_length--;
              bit_length = !dst_length ? 0
                                       : (8 * dst_length -
@@ -4459,8 +4634,9 @@ static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size,
                  continue;
              }
  
-            // FIXME do not discard SEI id
-            if (avctx->skip_frame >= AVDISCARD_NONREF && h->nal_ref_idc == 0)
+            if (avctx->skip_frame >= AVDISCARD_NONREF &&
+                h->nal_ref_idc == 0 &&
+                h->nal_unit_type != NAL_SEI)
                  continue;
  
  again:
@@ -4471,8 +4647,11 @@ again:
                  (h->avctx->active_thread_type & FF_THREAD_FRAME) &&
                  (hx->nal_unit_type != NAL_PPS &&
                   hx->nal_unit_type != NAL_SPS)) {
-                av_log(avctx, AV_LOG_INFO, "Ignoring NAL unit %d during "
-                       "extradata parsing\n", hx->nal_unit_type);
+                if (hx->nal_unit_type < NAL_AUD ||
+                    hx->nal_unit_type > NAL_AUXILIARY_SLICE)
+                    av_log(avctx, AV_LOG_INFO,
+                           "Ignoring NAL unit %d during extradata parsing\n",
+                           hx->nal_unit_type);
                  hx->nal_unit_type = NAL_FF_IGNORE;
              }
              err = 0;
@@ -4494,10 +4673,26 @@ again:
                  if ((err = decode_slice_header(hx, h)))
                      break;
  
+                if (h->sei_recovery_frame_cnt >= 0 && h->recovery_frame < 0) {
+                    h->recovery_frame = (h->frame_num + h->sei_recovery_frame_cnt) &
+                                        ((1 << h->sps.log2_max_frame_num) - 1);
+                }
+
                  h->cur_pic_ptr->f.key_frame |=
                      (hx->nal_unit_type == NAL_IDR_SLICE) ||
                      (h->sei_recovery_frame_cnt >= 0);
  
+                if (hx->nal_unit_type == NAL_IDR_SLICE ||
+                    h->recovery_frame == h->frame_num) {
+                    h->recovery_frame         = -1;
+                    h->cur_pic_ptr->recovered = 1;
+                }
+                // If we have an IDR, all frames after it in decoded order are
+                // "recovered".
+                if (hx->nal_unit_type == NAL_IDR_SLICE)
+                    h->frame_recovered |= FRAME_RECOVERED_IDR;
+                h->cur_pic_ptr->recovered |= !!(h->frame_recovered & FRAME_RECOVERED_IDR);
+
                  if (h->current_slice == 1) {
                      if (!(avctx->flags2 & CODEC_FLAG2_CHUNKS))
                          decode_postinit(h, nal_index >= nals_needed);
@@ -4530,8 +4725,13 @@ again:
                  hx->intra_gb_ptr =
                  hx->inter_gb_ptr = NULL;
  
-                if ((err = decode_slice_header(hx, h)) < 0)
+                if ((err = decode_slice_header(hx, h)) < 0) {
+                    /* make sure data_partitioning is cleared if it was set
+                     * before, so we don't try decoding a slice without a valid
+                     * slice header later */
+                    h->data_partitioning = 0;
                      break;
+                }
  
                  hx->data_partitioning = 1;
                  break;
@@ -4658,8 +4858,8 @@ static int output_frame(H264Context *h, AVFrame *dst, AVFrame *src)
      return 0;
  }
  
-static int decode_frame(AVCodecContext *avctx, void *data,
-                        int *got_frame, AVPacket *avpkt)
+static int h264_decode_frame(AVCodecContext *avctx, void *data,
+                             int *got_frame, AVPacket *avpkt)
  {
      const uint8_t *buf = avpkt->data;
      int buf_size       = avpkt->size;
@@ -4727,10 +4927,12 @@ out:
  
          field_end(h, 0);
  
-        if (!h->next_output_pic) {
-            /* Wait for second field. */
-            *got_frame = 0;
-        } else {
+        *got_frame = 0;
+        if (h->next_output_pic && ((avctx->flags & CODEC_FLAG_OUTPUT_CORRUPT) ||
+                                   h->next_output_pic->recovered)) {
+            if (!h->next_output_pic->recovered)
+                h->next_output_pic->f.flags |= AV_FRAME_FLAG_CORRUPT;
+
              ret = output_frame(h, pict, &h->next_output_pic->f);
              if (ret < 0)
                  return ret;
@@ -4738,7 +4940,7 @@ out:
          }
      }
  
-    assert(pict->data[0] || !*got_frame);
+    assert(pict->buf[0] || !*got_frame);
  
      return get_consumed_bytes(buf_index, buf_size);
  }
@@ -4786,17 +4988,17 @@ static const AVProfile profiles[] = {
  
  AVCodec ff_h264_decoder = {
      .name                  = "h264",
+    .long_name             = NULL_IF_CONFIG_SMALL("H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
      .type                  = AVMEDIA_TYPE_VIDEO,
      .id                    = AV_CODEC_ID_H264,
      .priv_data_size        = sizeof(H264Context),
      .init                  = ff_h264_decode_init,
      .close                 = h264_decode_end,
-    .decode                = decode_frame,
+    .decode                = h264_decode_frame,
      .capabilities          = /*CODEC_CAP_DRAW_HORIZ_BAND |*/ CODEC_CAP_DR1 |
                               CODEC_CAP_DELAY | CODEC_CAP_SLICE_THREADS |
                               CODEC_CAP_FRAME_THREADS,
      .flush                 = flush_dpb,
-    .long_name             = NULL_IF_CONFIG_SMALL("H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
      .init_thread_copy      = ONLY_IF_THREADS_ENABLED(decode_init_thread_copy),
      .update_thread_context = ONLY_IF_THREADS_ENABLED(decode_update_thread_context),
      .profiles              = NULL_IF_CONFIG_SMALL(profiles),