amrwbdec: set channels, channel_layout, and sample_rate

[ffmpeg] / libavcodec / vorbisdec.c
diff --git a/libavcodec/vorbisdec.c b/libavcodec/vorbisdec.c

index 381b61d060daac57970f8b34f85215154d836bac..f5a541adae436809151d31c1e4fd6ee522c42dab 100644 (file)
--- a/libavcodec/vorbisdec.c
+++ b/libavcodec/vorbisdec.c
@@ -25,7 +25,8 @@
  #include <inttypes.h>
  #include <math.h>
  
-#define ALT_BITSTREAM_READER_LE
+#define BITSTREAM_READER_LE
+#include "libavutil/float_dsp.h"
  #include "avcodec.h"
  #include "get_bits.h"
  #include "dsputil.h"
@@ -124,6 +125,7 @@ typedef struct vorbis_context_s {
      AVFrame frame;
      GetBitContext gb;
      DSPContext dsp;
+    AVFloatDSPContext fdsp;
      FmtConvertContext fmt_conv;
  
      FFTContext mdct[2];
@@ -203,7 +205,7 @@ static void vorbis_free(vorbis_context *vc)
  
      for (i = 0; i < vc->codebook_count; ++i) {
          av_free(vc->codebooks[i].codevectors);
-        free_vlc(&vc->codebooks[i].vlc);
+        ff_free_vlc(&vc->codebooks[i].vlc);
      }
      av_freep(&vc->codebooks);
  
@@ -574,7 +576,11 @@ static int vorbis_parse_setup_hdr_floors(vorbis_context *vc)
              }
  
  // Precalculate order of x coordinates - needed for decode
-            ff_vorbis_ready_floor1_list(floor_setup->data.t1.list, floor_setup->data.t1.x_list_dim);
+            if (ff_vorbis_ready_floor1_list(vc->avccontext,
+                                            floor_setup->data.t1.list,
+                                            floor_setup->data.t1.x_list_dim)) {
+                return AVERROR_INVALIDDATA;
+            }
          } else if (floor_setup->floor_type == 0) {
              unsigned max_codebook_dim = 0;
  
@@ -675,7 +681,7 @@ static int vorbis_parse_setup_hdr_residues(vorbis_context *vc)
          res_setup->partition_size = get_bits(gb, 24) + 1;
          /* Validations to prevent a buffer overflow later. */
          if (res_setup->begin>res_setup->end ||
-            res_setup->end > vc->avccontext->channels * vc->blocksize[1] / 2 ||
+            res_setup->end > (res_setup->type == 2 ? vc->avccontext->channels : 1) * vc->blocksize[1] / 2 ||
              (res_setup->end-res_setup->begin) / res_setup->partition_size > V_MAX_PARTITIONS) {
              av_log(vc->avccontext, AV_LOG_ERROR,
                     "partition out of bounds: type, begin, end, size, blocksize: %"PRIu16", %"PRIu32", %"PRIu32", %u, %"PRIu32"\n",
@@ -816,8 +822,7 @@ static void create_map(vorbis_context *vc, unsigned floor_number)
  
          for (idx = 0; idx < n; ++idx) {
              map[idx] = floor(BARK((vf->rate * idx) / (2.0f * n)) *
-                             ((vf->bark_map_size) /
-                              BARK(vf->rate / 2.0f)));
+                             (vf->bark_map_size / BARK(vf->rate / 2.0f)));
              if (vf->bark_map_size-1 < map[idx])
                  map[idx] = vf->bark_map_size - 1;
          }
@@ -975,11 +980,12 @@ static av_cold int vorbis_decode_init(AVCodecContext *avccontext)
      int headers_len    = avccontext->extradata_size;
      uint8_t *header_start[3];
      int header_len[3];
-    GetBitContext *gb = &(vc->gb);
+    GetBitContext *gb = &vc->gb;
      int hdr_type, ret;
  
      vc->avccontext = avccontext;
-    dsputil_init(&vc->dsp, avccontext);
+    ff_dsputil_init(&vc->dsp, avccontext);
+    avpriv_float_dsp_init(&vc->fdsp, avccontext->flags & CODEC_FLAG_BITEXACT);
      ff_fmt_convert_init(&vc->fmt_conv, avccontext);
  
      if (avccontext->request_sample_fmt == AV_SAMPLE_FMT_FLT) {
@@ -1032,7 +1038,6 @@ static av_cold int vorbis_decode_init(AVCodecContext *avccontext)
  
      avccontext->channels    = vc->audio_channels;
      avccontext->sample_rate = vc->audio_samplerate;
-    avccontext->frame_size  = FFMIN(vc->blocksize[0], vc->blocksize[1]) >> 2;
  
      avcodec_get_frame_defaults(&vc->frame);
      avccontext->coded_frame = &vc->frame;
@@ -1245,20 +1250,20 @@ static int vorbis_floor1_decode(vorbis_context *vc,
              floor1_flag[i]               = 1;
              if (val >= room) {
                  if (highroom > lowroom) {
-                    floor1_Y_final[i] = val - lowroom + predicted;
+                    floor1_Y_final[i] = av_clip_uint16(val - lowroom + predicted);
                  } else {
-                    floor1_Y_final[i] = predicted - val + highroom - 1;
+                    floor1_Y_final[i] = av_clip_uint16(predicted - val + highroom - 1);
                  }
              } else {
                  if (val & 1) {
-                    floor1_Y_final[i] = predicted - (val + 1) / 2;
+                    floor1_Y_final[i] = av_clip_uint16(predicted - (val + 1) / 2);
                  } else {
-                    floor1_Y_final[i] = predicted + val / 2;
+                    floor1_Y_final[i] = av_clip_uint16(predicted + val / 2);
                  }
              }
          } else {
              floor1_flag[i]    = 0;
-            floor1_Y_final[i] = predicted;
+            floor1_Y_final[i] = av_clip_uint16(predicted);
          }
  
          av_dlog(NULL, " Decoded floor(%d) = %u / val %u\n",
@@ -1282,6 +1287,7 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
                                                             uint8_t *do_not_decode,
                                                             float *vec,
                                                             unsigned vlen,
+                                                           unsigned ch_left,
                                                             int vr_type)
  {
      GetBitContext *gb = &vc->gb;
@@ -1289,6 +1295,7 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
      unsigned ptns_to_read = vr->ptns_to_read;
      uint8_t *classifs = vr->classifs;
      unsigned pass, ch_used, i, j, k, l;
+    unsigned max_output = (ch - 1) * vlen;
  
      if (vr_type == 2) {
          for (j = 1; j < ch; ++j)
@@ -1296,8 +1303,15 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
          if (do_not_decode[0])
              return 0;
          ch_used = 1;
+        max_output += vr->end / ch;
      } else {
          ch_used = ch;
+        max_output += vr->end;
+    }
+
+    if (max_output > ch_left * vlen) {
+        av_log(vc->avccontext, AV_LOG_ERROR, "Insufficient output buffer\n");
+        return -1;
      }
  
      av_dlog(NULL, " residue type 0/1/2 decode begin, ch: %d  cpc %d  \n", ch, c_p_c);
@@ -1340,8 +1354,7 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
                          if (vqbook >= 0 && vc->codebooks[vqbook].codevectors) {
                              unsigned coffs;
                              unsigned dim  = vc->codebooks[vqbook].dimensions;
-                            unsigned step = dim == 1 ? vr->partition_size
-                                                     : FASTDIV(vr->partition_size, dim);
+                            unsigned step = FASTDIV(vr->partition_size << 1, dim << 1);
                              vorbis_codebook codebook = vc->codebooks[vqbook];
  
                              if (vr_type == 0) {
@@ -1350,14 +1363,14 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
                                  for (k = 0; k < step; ++k) {
                                      coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
                                      for (l = 0; l < dim; ++l)
-                                        vec[voffs + k + l * step] += codebook.codevectors[coffs + l];  // FPMATH
+                                        vec[voffs + k + l * step] += codebook.codevectors[coffs + l];
                                  }
                              } else if (vr_type == 1) {
                                  voffs = voffset + j * vlen;
                                  for (k = 0; k < step; ++k) {
                                      coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
                                      for (l = 0; l < dim; ++l, ++voffs) {
-                                        vec[voffs]+=codebook.codevectors[coffs+l];  // FPMATH
+                                        vec[voffs]+=codebook.codevectors[coffs+l];
  
                                          av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d  \n",
                                                  pass, voffs, vec[voffs], codebook.codevectors[coffs+l], coffs);
@@ -1369,23 +1382,23 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
                                  if (dim == 2) {
                                      for (k = 0; k < step; ++k) {
                                          coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 2;
-                                        vec[voffs + k       ] += codebook.codevectors[coffs    ];  // FPMATH
-                                        vec[voffs + k + vlen] += codebook.codevectors[coffs + 1];  // FPMATH
+                                        vec[voffs + k       ] += codebook.codevectors[coffs    ];
+                                        vec[voffs + k + vlen] += codebook.codevectors[coffs + 1];
                                      }
                                  } else if (dim == 4) {
                                      for (k = 0; k < step; ++k, voffs += 2) {
                                          coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 4;
-                                        vec[voffs           ] += codebook.codevectors[coffs    ];  // FPMATH
-                                        vec[voffs + 1       ] += codebook.codevectors[coffs + 2];  // FPMATH
-                                        vec[voffs + vlen    ] += codebook.codevectors[coffs + 1];  // FPMATH
-                                        vec[voffs + vlen + 1] += codebook.codevectors[coffs + 3];  // FPMATH
+                                        vec[voffs           ] += codebook.codevectors[coffs    ];
+                                        vec[voffs + 1       ] += codebook.codevectors[coffs + 2];
+                                        vec[voffs + vlen    ] += codebook.codevectors[coffs + 1];
+                                        vec[voffs + vlen + 1] += codebook.codevectors[coffs + 3];
                                      }
                                  } else
                                  for (k = 0; k < step; ++k) {
                                      coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
                                      for (l = 0; l < dim; l += 2, voffs++) {
-                                        vec[voffs       ] += codebook.codevectors[coffs + l    ];  // FPMATH
-                                        vec[voffs + vlen] += codebook.codevectors[coffs + l + 1];  // FPMATH
+                                        vec[voffs       ] += codebook.codevectors[coffs + l    ];
+                                        vec[voffs + vlen] += codebook.codevectors[coffs + l + 1];
  
                                          av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d  \n",
                                                  pass, voffset / ch + (voffs % ch) * vlen,
@@ -1395,17 +1408,24 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
                                  }
  
                              } else if (vr_type == 2) {
-                                voffs = voffset;
+                                unsigned voffs_div = FASTDIV(voffset << 1, ch <<1);
+                                unsigned voffs_mod = voffset - voffs_div * ch;
  
                                  for (k = 0; k < step; ++k) {
                                      coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
-                                    for (l = 0; l < dim; ++l, ++voffs) {
-                                        vec[voffs / ch + (voffs % ch) * vlen] += codebook.codevectors[coffs + l];  // FPMATH FIXME use if and counter instead of / and %
+                                    for (l = 0; l < dim; ++l) {
+                                        vec[voffs_div + voffs_mod * vlen] +=
+                                            codebook.codevectors[coffs + l];
  
                                          av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d  \n",
-                                                pass, voffset / ch + (voffs % ch) * vlen,
-                                                vec[voffset / ch + (voffs % ch) * vlen],
+                                                pass, voffs_div + voffs_mod * vlen,
+                                                vec[voffs_div + voffs_mod * vlen],
                                                  codebook.codevectors[coffs + l], coffs, l);
+
+                                        if (++voffs_mod == ch) {
+                                            voffs_div++;
+                                            voffs_mod = 0;
+                                        }
                                      }
                                  }
                              }
@@ -1424,21 +1444,22 @@ static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
  static inline int vorbis_residue_decode(vorbis_context *vc, vorbis_residue *vr,
                                          unsigned ch,
                                          uint8_t *do_not_decode,
-                                        float *vec, unsigned vlen)
+                                        float *vec, unsigned vlen,
+                                        unsigned ch_left)
  {
      if (vr->type == 2)
-        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 2);
+        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, ch_left, 2);
      else if (vr->type == 1)
-        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 1);
+        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, ch_left, 1);
      else if (vr->type == 0)
-        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 0);
+        return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, ch_left, 0);
      else {
          av_log(vc->avccontext, AV_LOG_ERROR, " Invalid residue type while residue decode?! \n");
          return AVERROR_INVALIDDATA;
      }
  }
  
-void vorbis_inverse_coupling(float *mag, float *ang, int blocksize)
+void ff_vorbis_inverse_coupling(float *mag, float *ang, int blocksize)
  {
      int i;
      for (i = 0;  i < blocksize;  i++) {
@@ -1479,6 +1500,8 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
      uint8_t res_chan[255];
      unsigned res_num = 0;
      int retlen  = 0;
+    unsigned ch_left = vc->audio_channels;
+    unsigned vlen;
  
      if (get_bits1(gb)) {
          av_log(vc->avccontext, AV_LOG_ERROR, "Not a Vorbis I audio packet.\n");
@@ -1498,11 +1521,14 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
  
      blockflag = vc->modes[mode_number].blockflag;
      blocksize = vc->blocksize[blockflag];
-    if (blockflag)
-        skip_bits(gb, 2); // previous_window, next_window
+    vlen = blocksize / 2;
+    if (blockflag) {
+        previous_window = get_bits(gb, 1);
+        skip_bits1(gb); // next_window
+    }
  
-    memset(ch_res_ptr,   0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
-    memset(ch_floor_ptr, 0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
+    memset(ch_res_ptr,   0, sizeof(float) * vc->audio_channels * vlen); //FIXME can this be removed ?
+    memset(ch_floor_ptr, 0, sizeof(float) * vc->audio_channels * vlen); //FIXME can this be removed ?
  
  // Decode floor
  
@@ -1522,7 +1548,7 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
              return AVERROR_INVALIDDATA;
          }
          no_residue[i] = ret;
-        ch_floor_ptr += blocksize / 2;
+        ch_floor_ptr += vlen;
      }
  
  // Nonzero vector propagate
@@ -1539,6 +1565,7 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
      for (i = 0; i < mapping->submaps; ++i) {
          vorbis_residue *residue;
          unsigned ch = 0;
+        int ret;
  
          for (j = 0; j < vc->audio_channels; ++j) {
              if ((mapping->submaps == 1) || (i == mapping->mux[j])) {
@@ -1553,11 +1580,23 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
              }
          }
          residue = &vc->residues[mapping->submap_residue[i]];
-        vorbis_residue_decode(vc, residue, ch, do_not_decode, ch_res_ptr, blocksize/2);
+        if (ch_left < ch) {
+            av_log(vc->avccontext, AV_LOG_ERROR, "Too many channels in vorbis_floor_decode.\n");
+            return -1;
+        }
+        if (ch) {
+            ret = vorbis_residue_decode(vc, residue, ch, do_not_decode, ch_res_ptr, vlen, ch_left);
+            if (ret < 0)
+                return ret;
+        }
  
-        ch_res_ptr += ch * blocksize / 2;
+        ch_res_ptr += ch * vlen;
+        ch_left -= ch;
      }
  
+    if (ch_left > 0)
+        return AVERROR_INVALIDDATA;
+
  // Inverse coupling
  
      for (i = mapping->coupling_steps - 1; i >= 0; --i) { //warning: i has to be signed
@@ -1575,11 +1614,11 @@ static int vorbis_parse_audio_packet(vorbis_context *vc)
      for (j = vc->audio_channels-1;j >= 0; j--) {
          ch_floor_ptr = vc->channel_floors   + j           * blocksize / 2;
          ch_res_ptr   = vc->channel_residues + res_chan[j] * blocksize / 2;
-        vc->dsp.vector_fmul(ch_floor_ptr, ch_floor_ptr, ch_res_ptr, blocksize / 2);
+        vc->fdsp.vector_fmul(ch_floor_ptr, ch_floor_ptr, ch_res_ptr, blocksize / 2);
          mdct->imdct_half(mdct, ch_res_ptr, ch_floor_ptr);
      }
  
-// Overlap/add, save data for next overlapping  FPMATH
+// Overlap/add, save data for next overlapping
  
      retlen = (blocksize + vc->blocksize[previous_window]) / 4;
      for (j = 0; j < vc->audio_channels; j++) {
@@ -1615,7 +1654,7 @@ static int vorbis_decode_frame(AVCodecContext *avccontext, void *data,
      const uint8_t *buf = avpkt->data;
      int buf_size       = avpkt->size;
      vorbis_context *vc = avccontext->priv_data;
-    GetBitContext *gb = &(vc->gb);
+    GetBitContext *gb = &vc->gb;
      const float *channel_ptrs[255];
      int i, len, ret;
  
@@ -1676,19 +1715,30 @@ static av_cold int vorbis_decode_close(AVCodecContext *avccontext)
      return 0;
  }
  
+static av_cold void vorbis_decode_flush(AVCodecContext *avccontext) /* Decoder .flush callback: clears the saved sample buffer and resets previous_window. */
+{
+    vorbis_context *vc = avccontext->priv_data; /* per-decoder private state */
+
+    if (vc->saved) { /* skip the clear when the saved buffer pointer is NULL */
+        memset(vc->saved, 0, (vc->blocksize[1] / 4) * vc->audio_channels *
+                             sizeof(*vc->saved)); /* zero blocksize[1] / 4 elements for each audio channel */
+    }
+    vc->previous_window = 0; /* reset the stored previous-window flag to 0 */
+}
+
  AVCodec ff_vorbis_decoder = {
-    .name           = "vorbis",
-    .type           = AVMEDIA_TYPE_AUDIO,
-    .id             = CODEC_ID_VORBIS,
-    .priv_data_size = sizeof(vorbis_context),
-    .init           = vorbis_decode_init,
-    .close          = vorbis_decode_close,
-    .decode         = vorbis_decode_frame,
-    .capabilities   = CODEC_CAP_DR1,
-    .long_name = NULL_IF_CONFIG_SMALL("Vorbis"),
+    .name            = "vorbis",
+    .type            = AVMEDIA_TYPE_AUDIO,
+    .id              = AV_CODEC_ID_VORBIS,
+    .priv_data_size  = sizeof(vorbis_context),
+    .init            = vorbis_decode_init,
+    .close           = vorbis_decode_close,
+    .decode          = vorbis_decode_frame,
+    .flush           = vorbis_decode_flush,
+    .capabilities    = CODEC_CAP_DR1,
+    .long_name       = NULL_IF_CONFIG_SMALL("Vorbis"),
      .channel_layouts = ff_vorbis_channel_layouts,
-    .sample_fmts = (const enum AVSampleFormat[]) {
+    .sample_fmts     = (const enum AVSampleFormat[]) {
          AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_NONE
      },
  };
-