dnxhddata: Fix 10-bit DNxHD quant matrices

[ffmpeg] / libavcodec / proresenc.c
diff --git a/libavcodec/proresenc.c b/libavcodec/proresenc.c

index 51e3783e50b45859b9b1743f6a9ba6495f65857f..0564b12ae29d388d00103776a3f66a30c82f6e73 100644 (file)
--- a/libavcodec/proresenc.c
+++ b/libavcodec/proresenc.c
@@ -23,8 +23,7 @@
  #include "libavutil/opt.h"
  #include "libavutil/pixdesc.h"
  #include "avcodec.h"
-#include "dct.h"
-#include "dsputil.h"
+#include "fdctdsp.h"
  #include "put_bits.h"
  #include "bytestream.h"
  #include "internal.h"
@@ -192,10 +191,11 @@ typedef struct ProresContext {
      const uint8_t *quant_mat;
      const uint8_t *scantable;
  
-    void (* fdct)(DSPContext *dsp, const uint16_t *src,
-                  int linesize, int16_t *block);
-    DSPContext dsp;
+    void (*fdct)(FDCTDSPContext *fdsp, const uint16_t *src,
+                 int linesize, int16_t *block);
+    FDCTDSPContext fdsp;
  
+    const AVFrame *pic;
      int mb_width, mb_height;
      int mbs_per_slice;
      int num_chroma_blocks, chroma_factor;
@@ -207,6 +207,7 @@ typedef struct ProresContext {
      int bits_per_mb;
      int force_quant;
      int alpha_bits;
+    int warn;
  
      char *vendor;
      int quant_sel;
@@ -263,27 +264,27 @@ static void get_slice_data(ProresContext *ctx, const uint16_t *src,
                         mb_width * sizeof(*emu_buf));
          }
          if (!is_chroma) {
-            ctx->fdct(&ctx->dsp, esrc, elinesize, blocks);
+            ctx->fdct(&ctx->fdsp, esrc, elinesize, blocks);
              blocks += 64;
              if (blocks_per_mb > 2) {
-                ctx->fdct(&ctx->dsp, esrc + 8, elinesize, blocks);
+                ctx->fdct(&ctx->fdsp, esrc + 8, elinesize, blocks);
                  blocks += 64;
              }
-            ctx->fdct(&ctx->dsp, esrc + elinesize * 4, elinesize, blocks);
+            ctx->fdct(&ctx->fdsp, esrc + elinesize * 4, elinesize, blocks);
              blocks += 64;
              if (blocks_per_mb > 2) {
-                ctx->fdct(&ctx->dsp, esrc + elinesize * 4 + 8, elinesize, blocks);
+                ctx->fdct(&ctx->fdsp, esrc + elinesize * 4 + 8, elinesize, blocks);
                  blocks += 64;
              }
          } else {
-            ctx->fdct(&ctx->dsp, esrc, elinesize, blocks);
+            ctx->fdct(&ctx->fdsp, esrc, elinesize, blocks);
              blocks += 64;
-            ctx->fdct(&ctx->dsp, esrc + elinesize * 4, elinesize, blocks);
+            ctx->fdct(&ctx->fdsp, esrc + elinesize * 4, elinesize, blocks);
              blocks += 64;
              if (blocks_per_mb > 2) {
-                ctx->fdct(&ctx->dsp, esrc + 8, elinesize, blocks);
+                ctx->fdct(&ctx->fdsp, esrc + 8, elinesize, blocks);
                  blocks += 64;
-                ctx->fdct(&ctx->dsp, esrc + elinesize * 4 + 8, elinesize, blocks);
+                ctx->fdct(&ctx->fdsp, esrc + elinesize * 4 + 8, elinesize, blocks);
                  blocks += 64;
              }
          }
@@ -469,7 +470,6 @@ static void put_alpha_run(PutBitContext *pb, int run)
  
  // todo alpha quantisation for high quants
  static int encode_alpha_plane(ProresContext *ctx, PutBitContext *pb,
-                              const uint16_t *src, int linesize,
                                int mbs_per_slice, uint16_t *blocks,
                                int quant)
  {
@@ -564,11 +564,15 @@ static int encode_slice(AVCodecContext *avctx, const AVFrame *pic,
              get_alpha_data(ctx, src, linesize, xp, yp,
                             pwidth, avctx->height / ctx->pictures_per_frame,
                             ctx->blocks[0], mbs_per_slice, ctx->alpha_bits);
-            sizes[i] = encode_alpha_plane(ctx, pb, src, linesize,
-                                          mbs_per_slice, ctx->blocks[0],
-                                          quant);
+            sizes[i] = encode_alpha_plane(ctx, pb, mbs_per_slice,
+                                          ctx->blocks[0], quant);
          }
          total_size += sizes[i];
+        if (put_bits_left(pb) < 0) {
+            av_log(avctx, AV_LOG_ERROR,
+                   "Underestimated required buffer size.\n");
+            return AVERROR_BUG;
+        }
      }
      return total_size;
  }
@@ -740,7 +744,7 @@ static int estimate_alpha_plane(ProresContext *ctx, int *error,
      return bits;
  }
  
-static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
+static int find_slice_quant(AVCodecContext *avctx,
                              int trellis_node, int x, int y, int mbs_per_slice,
                              ProresThreadData *td)
  {
@@ -762,7 +766,7 @@ static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
      if (ctx->pictures_per_frame == 1)
          line_add = 0;
      else
-        line_add = ctx->cur_picture_idx ^ !pic->top_field_first;
+        line_add = ctx->cur_picture_idx ^ !ctx->pic->top_field_first;
      mbs = x + mbs_per_slice;
  
      for (i = 0; i < ctx->num_planes; i++) {
@@ -782,9 +786,9 @@ static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
              pwidth         = avctx->width >> 1;
          }
  
-        linesize[i] = pic->linesize[i] * ctx->pictures_per_frame;
-        src = (const uint16_t*)(pic->data[i] + yp * linesize[i] +
-                                line_add * pic->linesize[i]) + xp;
+        linesize[i] = ctx->pic->linesize[i] * ctx->pictures_per_frame;
+        src = (const uint16_t *)(ctx->pic->data[i] + yp * linesize[i] +
+                                 line_add * ctx->pic->linesize[i]) + xp;
  
          if (i < 3) {
              get_slice_data(ctx, src, linesize[i], xp, yp,
@@ -817,10 +821,9 @@ static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
          if (ctx->alpha_bits)
              bits += estimate_alpha_plane(ctx, &error, src, linesize[3],
                                           mbs_per_slice, q, td->blocks[3]);
-        if (bits > 65000 * 8) {
+        if (bits > 65000 * 8)
              error = SCORE_LIMIT;
-            break;
-        }
+
          slice_bits[q]  = bits;
          slice_score[q] = error;
      }
@@ -908,7 +911,7 @@ static int find_quant_thread(AVCodecContext *avctx, void *arg,
      for (x = mb = 0; x < ctx->mb_width; x += mbs_per_slice, mb++) {
          while (ctx->mb_width - x < mbs_per_slice)
              mbs_per_slice >>= 1;
-        q = find_slice_quant(avctx, avctx->coded_frame,
+        q = find_slice_quant(avctx,
                               (mb + 1) * TRELLIS_WIDTH, x, y,
                               mbs_per_slice, td);
      }
@@ -932,16 +935,20 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
      int sizes[4] = { 0 };
      int slice_hdr_size = 2 + 2 * (ctx->num_planes - 1);
      int frame_size, picture_size, slice_size;
-    int pkt_size, ret;
+    int pkt_size, ret, max_slice_size = 0;
      uint8_t frame_flags;
  
-    *avctx->coded_frame           = *pic;
+    ctx->pic = pic;
+#if FF_API_CODED_FRAME
+FF_DISABLE_DEPRECATION_WARNINGS
      avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
      avctx->coded_frame->key_frame = 1;
+FF_ENABLE_DEPRECATION_WARNINGS
+#endif
  
-    pkt_size = ctx->frame_size_upper_bound + FF_MIN_BUFFER_SIZE;
+    pkt_size = ctx->frame_size_upper_bound;
  
-    if ((ret = ff_alloc_packet(pkt, pkt_size)) < 0) {
+    if ((ret = ff_alloc_packet(pkt, pkt_size + AV_INPUT_BUFFER_MIN_SIZE)) < 0) {
          av_log(avctx, AV_LOG_ERROR, "Error getting output packet.\n");
          return ret;
      }
@@ -962,7 +969,7 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
      bytestream_put_be16  (&buf, avctx->height);
  
      frame_flags = ctx->chroma_factor << 6;
-    if (avctx->flags & CODEC_FLAG_INTERLACED_DCT)
+    if (avctx->flags & AV_CODEC_FLAG_INTERLACED_DCT)
          frame_flags |= pic->top_field_first ? 0x04 : 0x08;
      bytestream_put_byte  (&buf, frame_flags);
  
@@ -1019,8 +1026,44 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                  bytestream_put_byte(&buf, slice_hdr_size << 3);
                  slice_hdr = buf;
                  buf += slice_hdr_size - 1;
+                if (pkt_size <= buf - orig_buf + 2 * max_slice_size) {
+                    uint8_t *start = pkt->data;
+                    // Recompute new size according to max_slice_size
+                    // and deduce delta
+                    int delta = 200 + ctx->pictures_per_frame *
+                                ctx->slices_per_picture * max_slice_size -
+                                pkt_size;
+
+                    delta = FFMAX(delta, 2 * max_slice_size);
+                    ctx->frame_size_upper_bound += delta;
+
+                    if (!ctx->warn) {
+                        avpriv_request_sample(avctx,
+                                              "Packet too small: is %i,"
+                                              " needs %i (slice: %i). "
+                                              "Correct allocation",
+                                              pkt_size, delta, max_slice_size);
+                        ctx->warn = 1;
+                    }
+
+                    ret = av_grow_packet(pkt, delta);
+                    if (ret < 0)
+                        return ret;
+
+                    pkt_size += delta;
+                    // restore pointers
+                    orig_buf         = pkt->data + (orig_buf         - start);
+                    buf              = pkt->data + (buf              - start);
+                    picture_size_pos = pkt->data + (picture_size_pos - start);
+                    slice_sizes      = pkt->data + (slice_sizes      - start);
+                    slice_hdr        = pkt->data + (slice_hdr        - start);
+                    tmp              = pkt->data + (tmp              - start);
+                }
                  init_put_bits(&pb, buf, (pkt_size - (buf - orig_buf)) * 8);
-                encode_slice(avctx, pic, &pb, sizes, x, y, q, mbs_per_slice);
+                ret = encode_slice(avctx, pic, &pb, sizes, x, y, q,
+                                   mbs_per_slice);
+                if (ret < 0)
+                    return ret;
  
                  bytestream_put_byte(&slice_hdr, q);
                  slice_size = slice_hdr_size + sizes[ctx->num_planes - 1];
@@ -1030,6 +1073,8 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                  }
                  bytestream_put_be16(&slice_sizes, slice_size);
                  buf += slice_size - slice_hdr_size;
+                if (max_slice_size < slice_size)
+                    max_slice_size = slice_size;
              }
          }
  
@@ -1056,8 +1101,6 @@ static av_cold int encode_close(AVCodecContext *avctx)
      ProresContext *ctx = avctx->priv_data;
      int i;
  
-    av_freep(&avctx->coded_frame);
-
      if (ctx->tdata) {
          for (i = 0; i < avctx->thread_count; i++)
              av_free(ctx->tdata[i].nodes);
@@ -1068,7 +1111,7 @@ static av_cold int encode_close(AVCodecContext *avctx)
      return 0;
  }
  
-static void prores_fdct(DSPContext *dsp, const uint16_t *src,
+static void prores_fdct(FDCTDSPContext *fdsp, const uint16_t *src,
                          int linesize, int16_t *block)
  {
      int x, y;
@@ -1079,7 +1122,7 @@ static void prores_fdct(DSPContext *dsp, const uint16_t *src,
              block[y * 8 + x] = tsrc[x];
          tsrc += linesize >> 1;
      }
-    dsp->fdct(block);
+    fdsp->fdct(block);
  }
  
  static av_cold int encode_init(AVCodecContext *avctx)
@@ -1088,17 +1131,14 @@ static av_cold int encode_init(AVCodecContext *avctx)
      int mps;
      int i, j;
      int min_quant, max_quant;
-    int interlaced = !!(avctx->flags & CODEC_FLAG_INTERLACED_DCT);
+    int interlaced = !!(avctx->flags & AV_CODEC_FLAG_INTERLACED_DCT);
  
      avctx->bits_per_raw_sample = 10;
-    avctx->coded_frame = av_frame_alloc();
-    if (!avctx->coded_frame)
-        return AVERROR(ENOMEM);
  
      ctx->fdct      = prores_fdct;
      ctx->scantable = interlaced ? ff_prores_interlaced_scan
                                  : ff_prores_progressive_scan;
-    ff_dsputil_init(&ctx->dsp, avctx);
+    ff_fdctdsp_init(&ctx->fdsp, avctx);
  
      mps = ctx->mbs_per_slice;
      if (mps & (mps - 1)) {
@@ -1111,6 +1151,7 @@ static av_cold int encode_init(AVCodecContext *avctx)
              av_log(avctx, AV_LOG_ERROR, "alpha bits should be 0, 8 or 16\n");
              return AVERROR(EINVAL);
          }
+        avctx->bits_per_coded_sample = 32;
      } else {
          ctx->alpha_bits = 0;
      }
@@ -1205,8 +1246,6 @@ static av_cold int encode_init(AVCodecContext *avctx)
          ctx->bits_per_mb = ls * 8;
          if (ctx->chroma_factor == CFACTOR_Y444)
              ctx->bits_per_mb += ls * 4;
-        if (ctx->num_planes == 4)
-            ctx->bits_per_mb += ls * 4;
      }
  
      ctx->frame_size_upper_bound = ctx->pictures_per_frame *
@@ -1215,6 +1254,14 @@ static av_cold int encode_init(AVCodecContext *avctx)
                                     (mps * ctx->bits_per_mb) / 8)
                                    + 200;
  
+    if (ctx->alpha_bits) {
+         // The alpha plane is run-coded and might exceed the bit budget.
+         ctx->frame_size_upper_bound += ctx->pictures_per_frame *
+                                        ctx->slices_per_picture *
+         /* num pixels per slice */     (ctx->mbs_per_slice * 256 *
+         /* bits per pixel */            (1 + ctx->alpha_bits + 1) + 7 >> 3);
+    }
+
      avctx->codec_tag   = ctx->profile_info->tag;
  
      av_log(avctx, AV_LOG_DEBUG,
@@ -1285,7 +1332,7 @@ AVCodec ff_prores_encoder = {
      .init           = encode_init,
      .close          = encode_close,
      .encode2        = encode_frame,
-    .capabilities   = CODEC_CAP_SLICE_THREADS,
+    .capabilities   = AV_CODEC_CAP_SLICE_THREADS,
      .pix_fmts       = (const enum AVPixelFormat[]) {
                            AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10,
                            AV_PIX_FMT_YUVA444P10, AV_PIX_FMT_NONE