hevc: change the stride of the MC buffer to be in bytes instead of elements

[ffmpeg] / libavcodec / h264.h
diff --git a/libavcodec/h264.h b/libavcodec/h264.h

index 069600029407c2b6907e5e7e77a0be3c884f6b4d..e9fd9ccec5a5d2d9ba0d643eb7199c19e5dac912 100644 (file)
--- a/libavcodec/h264.h
+++ b/libavcodec/h264.h
@@ -29,6 +29,7 @@
  #define AVCODEC_H264_H
  
  #include "libavutil/intreadwrite.h"
+#include "libavutil/thread.h"
  #include "cabac.h"
  #include "error_resilience.h"
  #include "get_bits.h"
@@ -36,6 +37,7 @@
  #include "h264dsp.h"
  #include "h264pred.h"
  #include "h264qpel.h"
+#include "internal.h"
  #include "mpegutils.h"
  #include "parser.h"
  #include "qpeldsp.h"
@@ -128,6 +130,7 @@ enum {
  typedef enum {
      SEI_TYPE_BUFFERING_PERIOD       = 0,   ///< buffering period (H.264, D.1.1)
      SEI_TYPE_PIC_TIMING             = 1,   ///< picture timing
+    SEI_TYPE_USER_DATA_REGISTERED   = 4,   ///< registered user data as specified by Rec. ITU-T T.35
      SEI_TYPE_USER_DATA_UNREGISTERED = 5,   ///< unregistered user data
      SEI_TYPE_RECOVERY_POINT         = 6,   ///< recovery point (frame # to decoder sync)
      SEI_TYPE_FRAME_PACKING          = 45,  ///< frame packing arrangement
@@ -260,7 +263,7 @@ typedef struct MMCO {
  } MMCO;
  
  typedef struct H264Picture {
-    struct AVFrame f;
+    AVFrame *f;
      ThreadFrame tf;
  
      AVBufferRef *qscale_table_buf;
@@ -291,13 +294,25 @@ typedef struct H264Picture {
      int mbaff;              ///< 1 -> MBAFF frame 0-> not MBAFF
      int field_picture;      ///< whether or not picture was encoded in separate fields
  
-    int needs_realloc;      ///< picture needs to be reallocated (eg due to a frame size change)
      int reference;
      int recovered;          ///< picture at IDR or recovery point + recovery count
  } H264Picture;
  
+typedef struct H264Ref {
+    uint8_t *data[3];
+    int linesize[3];
+
+    int reference;
+    int poc;
+    int pic_id;
+
+    H264Picture *parent;
+} H264Ref;
+
  typedef struct H264SliceContext {
      struct H264Context *h264;
+    GetBitContext gb;
+    ERContext er;
  
      int slice_num;
      int slice_type;
@@ -353,9 +368,22 @@ typedef struct H264SliceContext {
      unsigned int topright_samples_available;
      unsigned int left_samples_available;
  
+    ptrdiff_t linesize, uvlinesize;
      ptrdiff_t mb_linesize;  ///< may be equal to s->linesize or s->linesize * 2, for mbaff
      ptrdiff_t mb_uvlinesize;
  
+    int mb_x, mb_y;
+    int mb_xy;
+    int resync_mb_x;
+    int resync_mb_y;
+    // index of the first MB of the next slice
+    int next_slice_idx;
+    int mb_skip_run;
+    int is_complex;
+
+    int mb_field_decoding_flag;
+    int mb_mbaff;               ///< mb_aff_frame && mb_field_decoding_flag
+
      int redundant_pic_count;
  
      /**
@@ -381,12 +409,20 @@ typedef struct H264SliceContext {
       */
      unsigned int ref_count[2];          ///< counts frames or fields, depending on current mb mode
      unsigned int list_count;
-    H264Picture ref_list[2][48];        /**< 0..15: frame refs, 16..47: mbaff field refs.
+    H264Ref ref_list[2][48];        /**< 0..15: frame refs, 16..47: mbaff field refs.
                                           *   Reordered version of default_ref_list
                                           *   according to picture reordering in slice header */
      int ref2frm[MAX_SLICES][2][64];     ///< reference to frame number lists, used in the loop filter, the first 2 are for -2,-1
  
      const uint8_t *intra_pcm_ptr;
+    int16_t *dc_val_base;
+
+    uint8_t *bipred_scratchpad;
+    uint8_t *edge_emu_buffer;
+    uint8_t (*top_borders[2])[(16 * 3) * 2];
+    int bipred_scratchpad_allocated;
+    int edge_emu_buffer_allocated;
+    int top_borders_allocated[2];
  
      /**
       * non zero coeff count cache.
@@ -419,6 +455,10 @@ typedef struct H264SliceContext {
      CABACContext cabac;
      uint8_t cabac_state[1024];
      int cabac_init_idc;
+
+    // rbsp buffer used for this slice
+    uint8_t *rbsp_buffer;
+    unsigned int rbsp_buffer_size;
  } H264SliceContext;
  
  /**
@@ -431,9 +471,8 @@ typedef struct H264Context {
      H264ChromaContext h264chroma;
      H264QpelContext h264qpel;
      GetBitContext gb;
-    ERContext er;
  
-    H264Picture *DPB;
+    H264Picture DPB[H264_MAX_PICTURE_COUNT];
      H264Picture *cur_pic_ptr;
      H264Picture cur_pic;
  
@@ -444,7 +483,6 @@ typedef struct H264Context {
  
      /* coded dimensions -- 16 * mb w/h */
      int width, height;
-    ptrdiff_t linesize, uvlinesize;
      int chroma_x_shift, chroma_y_shift;
  
      int droppable;
@@ -457,7 +495,6 @@ typedef struct H264Context {
  
      int8_t(*intra4x4_pred_mode);
      H264PredContext hpc;
-    uint8_t (*top_borders[2])[(16 * 3) * 2];
  
      uint8_t (*non_zero_count)[48];
  
@@ -486,19 +523,11 @@ typedef struct H264Context {
  
      // interlacing specific flags
      int mb_aff_frame;
-    int mb_field_decoding_flag;
-    int mb_mbaff;               ///< mb_aff_frame && mb_field_decoding_flag
      int picture_structure;
      int first_field;
  
      uint8_t *list_counts;               ///< Array of list_count per MB specifying the slice type
  
-    // data partitioning
-    GetBitContext intra_gb;
-    GetBitContext inter_gb;
-    GetBitContext *intra_gb_ptr;
-    GetBitContext *inter_gb_ptr;
-
      /* 0x100 -> non null luma_dc, 0x80/0x40 -> non null chroma_dc (cb/cr), 0x?0 -> chroma_cbp(0, 1, 2), 0x0? luma_cbp */
      uint16_t *cbp_table;
  
@@ -522,24 +551,16 @@ typedef struct H264Context {
  
      int x264_build;
  
-    int mb_x, mb_y;
-    int resync_mb_x;
-    int resync_mb_y;
-    int mb_skip_run;
+    int mb_y;
      int mb_height, mb_width;
      int mb_stride;
      int mb_num;
-    int mb_xy;
-
-    int is_complex;
  
      // =============================================================
      // Things below are not used in the MB or more inner code
  
      int nal_ref_idc;
      int nal_unit_type;
-    uint8_t *rbsp_buffer[2];
-    unsigned int rbsp_buffer_size[2];
  
      /**
       * Used to parse AVC variant of h264
@@ -579,13 +600,12 @@ typedef struct H264Context {
       */
      int max_pic_num;
  
-    H264Picture default_ref_list[2][32]; ///< base reference list for all slices of a coded picture
+    H264Ref default_ref_list[2][32]; ///< base reference list for all slices of a coded picture
      H264Picture *short_ref[32];
      H264Picture *long_ref[32];
      H264Picture *delayed_pic[MAX_DELAYED_PIC_COUNT + 2]; // FIXME size?
      int last_pocs[MAX_DELAYED_PIC_COUNT];
      H264Picture *next_output_pic;
-    int outputed_poc;
      int next_outputed_poc;
  
      /**
@@ -602,8 +622,6 @@ typedef struct H264Context {
       * @name Members for slice based multithreading
       * @{
       */
-    struct H264Context *thread_context[H264_MAX_THREADS];
-
      /**
       * current slice number, used to initalize slice_num of each thread/context
       */
@@ -658,6 +676,14 @@ typedef struct H264Context {
      int sei_anticlockwise_rotation;
      int sei_hflip, sei_vflip;
  
+    /**
+     * User data registered by Rec. ITU-T T.35 SEI
+     */
+    int sei_reguserdata_afd_present;
+    uint8_t active_format_description;
+    int a53_caption_size;
+    uint8_t *a53_caption;
+
      /**
       * Bit set of clock types for fields/frames in picture timing SEI message.
       * For each found ct_type, appropriate bit is set (e.g., bit 1 for
@@ -705,15 +731,17 @@ typedef struct H264Context {
  
      int frame_recovered;    ///< Initial frame has been completely recovered
  
+    /* for frame threading, this is set to 1
+     * after finish_setup() has been called, so we cannot modify
+     * some context properties (which are supposed to stay constant between
+     * slices) anymore */
+    int setup_finished;
  
      // Timestamp stuff
      int sei_buffering_period_present;   ///< Buffering period SEI flag
      int initial_cpb_removal_delay[32];  ///< Initial timestamps for CPBs
  
-    int cur_chroma_format_idc;
-    uint8_t *bipred_scratchpad;
-    uint8_t *edge_emu_buffer;
-    int16_t *dc_val_base;
+    int enable_er;
  
      AVBufferPool *qscale_table_pool;
      AVBufferPool *mb_type_pool;
@@ -756,7 +784,7 @@ int ff_h264_decode_picture_parameter_set(H264Context *h, int bit_length);
   *                   or a decode rbsp tailing?
   * @return decoded bytes, might be src+1 if no escapes
   */
-const uint8_t *ff_h264_decode_nal(H264Context *h, const uint8_t *src,
+const uint8_t *ff_h264_decode_nal(H264Context *h, H264SliceContext *sl, const uint8_t *src,
                                    int *dst_length, int *consumed, int length);
  
  /**
@@ -799,16 +827,16 @@ int ff_generate_sliding_window_mmcos(H264Context *h, int first_slice);
   * Check if the top & left blocks are available if needed & change the
   * dc mode so it only uses the available blocks.
   */
-int ff_h264_check_intra4x4_pred_mode(H264Context *h, H264SliceContext *sl);
+int ff_h264_check_intra4x4_pred_mode(const H264Context *h, H264SliceContext *sl);
  
  /**
   * Check if the top & left blocks are available if needed & change the
   * dc mode so it only uses the available blocks.
   */
-int ff_h264_check_intra_pred_mode(H264Context *h, H264SliceContext *sl,
+int ff_h264_check_intra_pred_mode(const H264Context *h, H264SliceContext *sl,
                                    int mode, int is_chroma);
  
-void ff_h264_hl_decode_mb(H264Context *h, H264SliceContext *sl);
+void ff_h264_hl_decode_mb(const H264Context *h, H264SliceContext *sl);
  int ff_h264_decode_extradata(H264Context *h);
  int ff_h264_decode_init(AVCodecContext *avctx);
  void ff_h264_decode_init_vlc(void);
@@ -817,27 +845,27 @@ void ff_h264_decode_init_vlc(void);
   * Decode a macroblock
   * @return 0 if OK, ER_AC_ERROR / ER_DC_ERROR / ER_MV_ERROR on error
   */
-int ff_h264_decode_mb_cavlc(H264Context *h, H264SliceContext *sl);
+int ff_h264_decode_mb_cavlc(const H264Context *h, H264SliceContext *sl);
  
  /**
   * Decode a CABAC coded macroblock
   * @return 0 if OK, ER_AC_ERROR / ER_DC_ERROR / ER_MV_ERROR on error
   */
-int ff_h264_decode_mb_cabac(H264Context *h, H264SliceContext *sl);
+int ff_h264_decode_mb_cabac(const H264Context *h, H264SliceContext *sl);
  
-void ff_h264_init_cabac_states(H264Context *h, H264SliceContext *sl);
+void ff_h264_init_cabac_states(const H264Context *h, H264SliceContext *sl);
  
  void h264_init_dequant_tables(H264Context *h);
  
-void ff_h264_direct_dist_scale_factor(H264Context *const h, H264SliceContext *sl);
-void ff_h264_direct_ref_list_init(H264Context *const h, H264SliceContext *sl);
-void ff_h264_pred_direct_motion(H264Context *const h, H264SliceContext *sl,
+void ff_h264_direct_dist_scale_factor(const H264Context *const h, H264SliceContext *sl);
+void ff_h264_direct_ref_list_init(const H264Context *const h, H264SliceContext *sl);
+void ff_h264_pred_direct_motion(const H264Context *const h, H264SliceContext *sl,
                                  int *mb_type);
  
-void ff_h264_filter_mb_fast(H264Context *h, H264SliceContext *sl, int mb_x, int mb_y,
+void ff_h264_filter_mb_fast(const H264Context *h, H264SliceContext *sl, int mb_x, int mb_y,
                              uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr,
                              unsigned int linesize, unsigned int uvlinesize);
-void ff_h264_filter_mb(H264Context *h, H264SliceContext *sl, int mb_x, int mb_y,
+void ff_h264_filter_mb(const H264Context *h, H264SliceContext *sl, int mb_x, int mb_y,
                         uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr,
                         unsigned int linesize, unsigned int uvlinesize);
  
@@ -919,7 +947,7 @@ static av_always_inline uint16_t pack8to16(int a, int b)
  /**
   * Get the chroma qp.
   */
-static av_always_inline int get_chroma_qp(H264Context *h, int t, int qscale)
+static av_always_inline int get_chroma_qp(const H264Context *h, int t, int qscale)
  {
      return h->pps.chroma_qp_table[t][qscale];
  }
@@ -927,7 +955,7 @@ static av_always_inline int get_chroma_qp(H264Context *h, int t, int qscale)
  /**
   * Get the predicted intra4x4 prediction mode.
   */
-static av_always_inline int pred_intra_mode(H264Context *h,
+static av_always_inline int pred_intra_mode(const H264Context *h,
                                              H264SliceContext *sl, int n)
  {
      const int index8 = scan8[n];
@@ -935,7 +963,7 @@ static av_always_inline int pred_intra_mode(H264Context *h,
      const int top    = sl->intra4x4_pred_mode_cache[index8 - 8];
      const int min    = FFMIN(left, top);
  
-    tprintf(h->avctx, "mode:%d %d min:%d\n", left, top, min);
+    ff_tlog(h->avctx, "mode:%d %d min:%d\n", left, top, min);
  
      if (min < 0)
          return DC_PRED;
@@ -943,10 +971,10 @@ static av_always_inline int pred_intra_mode(H264Context *h,
          return min;
  }
  
-static av_always_inline void write_back_intra_pred_mode(H264Context *h,
+static av_always_inline void write_back_intra_pred_mode(const H264Context *h,
                                                          H264SliceContext *sl)
  {
-    int8_t *i4x4       = sl->intra4x4_pred_mode + h->mb2br_xy[h->mb_xy];
+    int8_t *i4x4       = sl->intra4x4_pred_mode + h->mb2br_xy[sl->mb_xy];
      int8_t *i4x4_cache = sl->intra4x4_pred_mode_cache;
  
      AV_COPY32(i4x4, i4x4_cache + 4 + 8 * 4);
@@ -955,10 +983,10 @@ static av_always_inline void write_back_intra_pred_mode(H264Context *h,
      i4x4[6] = i4x4_cache[7 + 8 * 1];
  }
  
-static av_always_inline void write_back_non_zero_count(H264Context *h,
+static av_always_inline void write_back_non_zero_count(const H264Context *h,
                                                         H264SliceContext *sl)
  {
-    const int mb_xy    = h->mb_xy;
+    const int mb_xy    = sl->mb_xy;
      uint8_t *nnz       = h->non_zero_count[mb_xy];
      uint8_t *nnz_cache = sl->non_zero_count_cache;
  
@@ -979,7 +1007,7 @@ static av_always_inline void write_back_non_zero_count(H264Context *h,
      }
  }
  
-static av_always_inline void write_back_motion_list(H264Context *h,
+static av_always_inline void write_back_motion_list(const H264Context *h,
                                                      H264SliceContext *sl,
                                                      int b_stride,
                                                      int b_xy, int b8_xy,
@@ -992,8 +1020,8 @@ static av_always_inline void write_back_motion_list(H264Context *h,
      AV_COPY128(mv_dst + 2 * b_stride, mv_src + 8 * 2);
      AV_COPY128(mv_dst + 3 * b_stride, mv_src + 8 * 3);
      if (CABAC(h)) {
-        uint8_t (*mvd_dst)[2] = &sl->mvd_table[list][FMO ? 8 * h->mb_xy
-                                                        : h->mb2br_xy[h->mb_xy]];
+        uint8_t (*mvd_dst)[2] = &sl->mvd_table[list][FMO ? 8 * sl->mb_xy
+                                                        : h->mb2br_xy[sl->mb_xy]];
          uint8_t(*mvd_src)[2]  = &sl->mvd_cache[list][scan8[0]];
          if (IS_SKIP(mb_type)) {
              AV_ZERO128(mvd_dst);
@@ -1015,13 +1043,13 @@ static av_always_inline void write_back_motion_list(H264Context *h,
      }
  }
  
-static av_always_inline void write_back_motion(H264Context *h,
+static av_always_inline void write_back_motion(const H264Context *h,
                                                 H264SliceContext *sl,
                                                 int mb_type)
  {
      const int b_stride      = h->b_stride;
-    const int b_xy  = 4 * h->mb_x + 4 * h->mb_y * h->b_stride; // try mb2b(8)_xy
-    const int b8_xy = 4 * h->mb_xy;
+    const int b_xy  = 4 * sl->mb_x + 4 * sl->mb_y * h->b_stride; // try mb2b(8)_xy
+    const int b8_xy = 4 * sl->mb_xy;
  
      if (USES_LIST(mb_type, 0)) {
          write_back_motion_list(h, sl, b_stride, b_xy, b8_xy, mb_type, 0);
@@ -1034,7 +1062,7 @@ static av_always_inline void write_back_motion(H264Context *h,
  
      if (sl->slice_type_nos == AV_PICTURE_TYPE_B && CABAC(h)) {
          if (IS_8X8(mb_type)) {
-            uint8_t *direct_table = &h->direct_table[4 * h->mb_xy];
+            uint8_t *direct_table = &h->direct_table[4 * sl->mb_xy];
              direct_table[1] = sl->sub_mb_type[1] >> 1;
              direct_table[2] = sl->sub_mb_type[2] >> 1;
              direct_table[3] = sl->sub_mb_type[3] >> 1;
@@ -1042,7 +1070,7 @@ static av_always_inline void write_back_motion(H264Context *h,
      }
  }
  
-static av_always_inline int get_dct8x8_allowed(H264Context *h, H264SliceContext *sl)
+static av_always_inline int get_dct8x8_allowed(const H264Context *h, H264SliceContext *sl)
  {
      if (h->sps.direct_8x8_inference_flag)
          return !(AV_RN64A(sl->sub_mb_type) &
@@ -1059,21 +1087,20 @@ int ff_h264_field_end(H264Context *h, H264SliceContext *sl, int in_setup);
  int ff_h264_ref_picture(H264Context *h, H264Picture *dst, H264Picture *src);
  void ff_h264_unref_picture(H264Context *h, H264Picture *pic);
  
-int ff_h264_context_init(H264Context *h);
-int ff_h264_set_parameter_from_sps(H264Context *h);
+int ff_h264_slice_context_init(H264Context *h, H264SliceContext *sl);
  
-void ff_h264_draw_horiz_band(H264Context *h, H264SliceContext *sl, int y, int height);
+void ff_h264_draw_horiz_band(const H264Context *h, H264SliceContext *sl, int y, int height);
  int ff_init_poc(H264Context *h, int pic_field_poc[2], int *pic_poc);
  int ff_pred_weight_table(H264Context *h, H264SliceContext *sl);
  int ff_set_ref_count(H264Context *h, H264SliceContext *sl);
  
-int ff_h264_decode_slice_header(H264Context *h, H264SliceContext *sl, H264Context *h0);
+int ff_h264_decode_slice_header(H264Context *h, H264SliceContext *sl);
  int ff_h264_execute_decode_slices(H264Context *h, unsigned context_count);
  int ff_h264_update_thread_context(AVCodecContext *dst,
                                    const AVCodecContext *src);
  
  void ff_h264_flush_change(H264Context *h);
  
-void ff_h264_free_tables(H264Context *h, int free_rbsp);
+void ff_h264_free_tables(H264Context *h);
  
  #endif /* AVCODEC_H264_H */