Add approved chunks to AAC encoder

[ffmpeg] / libavcodec / mpegaudiodec.c
diff --git a/libavcodec/mpegaudiodec.c b/libavcodec/mpegaudiodec.c

index bfd54d535ab579337b4a4c2abe8187778f4e0372..61e0c6fbd6d551d957e9988eefe09ddc3fcdd27c 100644 (file)
--- a/libavcodec/mpegaudiodec.c
+++ b/libavcodec/mpegaudiodec.c
@@ -46,9 +46,6 @@
  
  #include "mathops.h"
  
-#define FRAC_ONE    (1 << FRAC_BITS)
-
-#define FIX(a)   ((int)((a) * FRAC_ONE))
  /* WARNING: only correct for posititive numbers */
  #define FIXR(a)   ((int)((a) * FRAC_ONE + 0.5))
  #define FRAC_RND(a) (((a) + (FRAC_ONE/2)) >> FRAC_BITS)
@@ -59,15 +56,6 @@
  
  #define HEADER_SIZE 4
  
-/**
- * Context for MP3On4 decoder
- */
-typedef struct MP3On4DecodeContext {
-    int frames;   ///< number of mp3 frames per block (number of mp3 decoder instances)
-    int chan_cfg; ///< channel config number
-    MPADecodeContext *mp3decctx[5]; ///< MPADecodeContext for every decoder instance
-} MP3On4DecodeContext;
-
  /* layer 3 "granule" */
  typedef struct GranuleDef {
      uint8_t scfsi;
@@ -88,16 +76,6 @@ typedef struct GranuleDef {
      int32_t sb_hybrid[SBLIMIT * 18]; /* 576 samples */
  } GranuleDef;
  
-#define MODE_EXT_MS_STEREO 2
-#define MODE_EXT_I_STEREO  1
-
-/* layer 3 huffman tables */
-typedef struct HuffTable {
-    int xsize;
-    const uint8_t *bits;
-    const uint16_t *codes;
-} HuffTable;
-
  #include "mpegaudiodata.h"
  #include "mpegaudiodectab.h"
  
@@ -106,7 +84,19 @@ static void compute_antialias_float(MPADecodeContext *s, GranuleDef *g);
  
  /* vlc structure for decoding layer 3 huffman tables */
  static VLC huff_vlc[16];
+static VLC_TYPE huff_vlc_tables[
+  0+128+128+128+130+128+154+166+
+  142+204+190+170+542+460+662+414
+  ][2];
+static const int huff_vlc_tables_sizes[16] = {
+  0, 128, 128, 128, 130, 128, 154, 166,
+  142, 204, 190, 170, 542, 460, 662, 414
+};
  static VLC huff_quad_vlc[2];
+static VLC_TYPE huff_quad_vlc_tables[128+16][2];
+static const int huff_quad_vlc_tables_sizes[2] = {
+  128, 16
+};
  /* computed from band_size_long */
  static uint16_t band_index_long[9][23];
  /* XXX: free when all decoders are closed */
@@ -139,6 +129,68 @@ static const int32_t scale_factor_mult2[3][3] = {
  
  static DECLARE_ALIGNED_16(MPA_INT, window[512]);
  
+/**
+ * Convert region offsets to region sizes and truncate
+ * size to big_values.
+ */
+void ff_region_offset2size(GranuleDef *g){
+    int i, k, j=0;
+    g->region_size[2] = (576 / 2);
+    for(i=0;i<3;i++) {
+        k = FFMIN(g->region_size[i], g->big_values);
+        g->region_size[i] = k - j;
+        j = k;
+    }
+}
+
+void ff_init_short_region(MPADecodeContext *s, GranuleDef *g){
+    if (g->block_type == 2)
+        g->region_size[0] = (36 / 2);
+    else {
+        if (s->sample_rate_index <= 2)
+            g->region_size[0] = (36 / 2);
+        else if (s->sample_rate_index != 8)
+            g->region_size[0] = (54 / 2);
+        else
+            g->region_size[0] = (108 / 2);
+    }
+    g->region_size[1] = (576 / 2);
+}
+
+void ff_init_long_region(MPADecodeContext *s, GranuleDef *g, int ra1, int ra2){
+    int l;
+    g->region_size[0] =
+        band_index_long[s->sample_rate_index][ra1 + 1] >> 1;
+    /* should not overflow */
+    l = FFMIN(ra1 + ra2 + 2, 22);
+    g->region_size[1] =
+        band_index_long[s->sample_rate_index][l] >> 1;
+}
+
+void ff_compute_band_indexes(MPADecodeContext *s, GranuleDef *g){
+    if (g->block_type == 2) {
+        if (g->switch_point) {
+            /* if switched mode, we handle the 36 first samples as
+                long blocks.  For 8000Hz, we handle the 48 first
+                exponents as long blocks (XXX: check this!) */
+            if (s->sample_rate_index <= 2)
+                g->long_end = 8;
+            else if (s->sample_rate_index != 8)
+                g->long_end = 6;
+            else
+                g->long_end = 4; /* 8000 Hz */
+
+            g->short_start = 2 + (s->sample_rate_index != 8);
+        } else {
+            g->long_end = 0;
+            g->short_start = 0;
+        }
+    } else {
+        g->short_start = 13;
+        g->long_end = 22;
+    }
+}
+
  /* layer 1 unscaling */
  /* n = number of bits of the mantissa minus 1 */
  static inline int l1_unscale(int n, int mant, int scale_factor)
@@ -284,6 +336,8 @@ static int decode_init(AVCodecContext * avctx)
          s->compute_antialias= compute_antialias_float;
  
      if (!init && !avctx->parse_only) {
+        int offset;
+
          /* scale factors table for layer 1/2 */
          for(i=0;i<64;i++) {
              int shift, mod;
@@ -311,6 +365,7 @@ static int decode_init(AVCodecContext * avctx)
          ff_mpa_synth_init(window);
  
          /* huffman decode tables */
+        offset = 0;
          for(i=1;i<16;i++) {
              const HuffTable *h = &mpa_huff_tables[i];
              int xsize, x, y;
@@ -333,13 +388,25 @@ static int decode_init(AVCodecContext * avctx)
              }
  
              /* XXX: fail test */
+            huff_vlc[i].table = huff_vlc_tables+offset;
+            huff_vlc[i].table_allocated = huff_vlc_tables_sizes[i];
              init_vlc(&huff_vlc[i], 7, 512,
-                     tmp_bits, 1, 1, tmp_codes, 2, 2, 1);
+                     tmp_bits, 1, 1, tmp_codes, 2, 2,
+                     INIT_VLC_USE_NEW_STATIC);
+            offset += huff_vlc_tables_sizes[i];
          }
+        assert(offset == sizeof(huff_vlc_tables)/(sizeof(VLC_TYPE)*2));
+
+        offset = 0;
          for(i=0;i<2;i++) {
+            huff_quad_vlc[i].table = huff_quad_vlc_tables+offset;
+            huff_quad_vlc[i].table_allocated = huff_quad_vlc_tables_sizes[i];
              init_vlc(&huff_quad_vlc[i], i == 0 ? 7 : 4, 16,
-                     mpa_quad_bits[i], 1, 1, mpa_quad_codes[i], 1, 1, 1);
+                     mpa_quad_bits[i], 1, 1, mpa_quad_codes[i], 1, 1,
+                     INIT_VLC_USE_NEW_STATIC);
+            offset += huff_quad_vlc_tables_sizes[i];
          }
+        assert(offset == sizeof(huff_quad_vlc_tables)/(sizeof(VLC_TYPE)*2));
  
          for(i=0;i<9;i++) {
              k = 0;
@@ -726,6 +793,8 @@ static inline int round_sample(int *sum)
  /* signed 16x16 -> 32 multiply */
  #define MULS(ra, rb) MUL16(ra, rb)
  
+#define MLSS(rt, ra, rb) MLS16(rt, ra, rb)
+
  #else
  
  static inline int round_sample(int64_t *sum)
@@ -741,47 +810,49 @@ static inline int round_sample(int64_t *sum)
  }
  
  #   define MULS(ra, rb) MUL64(ra, rb)
+#   define MACS(rt, ra, rb) MAC64(rt, ra, rb)
+#   define MLSS(rt, ra, rb) MLS64(rt, ra, rb)
  #endif
  
-#define SUM8(sum, op, w, p) \
-{                                               \
-    sum op MULS((w)[0 * 64], p[0 * 64]);\
-    sum op MULS((w)[1 * 64], p[1 * 64]);\
-    sum op MULS((w)[2 * 64], p[2 * 64]);\
-    sum op MULS((w)[3 * 64], p[3 * 64]);\
-    sum op MULS((w)[4 * 64], p[4 * 64]);\
-    sum op MULS((w)[5 * 64], p[5 * 64]);\
-    sum op MULS((w)[6 * 64], p[6 * 64]);\
-    sum op MULS((w)[7 * 64], p[7 * 64]);\
+#define SUM8(op, sum, w, p)               \
+{                                         \
+    op(sum, (w)[0 * 64], p[0 * 64]);      \
+    op(sum, (w)[1 * 64], p[1 * 64]);      \
+    op(sum, (w)[2 * 64], p[2 * 64]);      \
+    op(sum, (w)[3 * 64], p[3 * 64]);      \
+    op(sum, (w)[4 * 64], p[4 * 64]);      \
+    op(sum, (w)[5 * 64], p[5 * 64]);      \
+    op(sum, (w)[6 * 64], p[6 * 64]);      \
+    op(sum, (w)[7 * 64], p[7 * 64]);      \
  }
  
  #define SUM8P2(sum1, op1, sum2, op2, w1, w2, p) \
  {                                               \
      int tmp;\
      tmp = p[0 * 64];\
-    sum1 op1 MULS((w1)[0 * 64], tmp);\
-    sum2 op2 MULS((w2)[0 * 64], tmp);\
+    op1(sum1, (w1)[0 * 64], tmp);\
+    op2(sum2, (w2)[0 * 64], tmp);\
      tmp = p[1 * 64];\
-    sum1 op1 MULS((w1)[1 * 64], tmp);\
-    sum2 op2 MULS((w2)[1 * 64], tmp);\
+    op1(sum1, (w1)[1 * 64], tmp);\
+    op2(sum2, (w2)[1 * 64], tmp);\
      tmp = p[2 * 64];\
-    sum1 op1 MULS((w1)[2 * 64], tmp);\
-    sum2 op2 MULS((w2)[2 * 64], tmp);\
+    op1(sum1, (w1)[2 * 64], tmp);\
+    op2(sum2, (w2)[2 * 64], tmp);\
      tmp = p[3 * 64];\
-    sum1 op1 MULS((w1)[3 * 64], tmp);\
-    sum2 op2 MULS((w2)[3 * 64], tmp);\
+    op1(sum1, (w1)[3 * 64], tmp);\
+    op2(sum2, (w2)[3 * 64], tmp);\
      tmp = p[4 * 64];\
-    sum1 op1 MULS((w1)[4 * 64], tmp);\
-    sum2 op2 MULS((w2)[4 * 64], tmp);\
+    op1(sum1, (w1)[4 * 64], tmp);\
+    op2(sum2, (w2)[4 * 64], tmp);\
      tmp = p[5 * 64];\
-    sum1 op1 MULS((w1)[5 * 64], tmp);\
-    sum2 op2 MULS((w2)[5 * 64], tmp);\
+    op1(sum1, (w1)[5 * 64], tmp);\
+    op2(sum2, (w2)[5 * 64], tmp);\
      tmp = p[6 * 64];\
-    sum1 op1 MULS((w1)[6 * 64], tmp);\
-    sum2 op2 MULS((w2)[6 * 64], tmp);\
+    op1(sum1, (w1)[6 * 64], tmp);\
+    op2(sum2, (w2)[6 * 64], tmp);\
      tmp = p[7 * 64];\
-    sum1 op1 MULS((w1)[7 * 64], tmp);\
-    sum2 op2 MULS((w2)[7 * 64], tmp);\
+    op1(sum1, (w1)[7 * 64], tmp);\
+    op2(sum2, (w2)[7 * 64], tmp);\
  }
  
  void ff_mpa_synth_init(MPA_INT *window)
@@ -832,10 +903,7 @@ void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
  #if FRAC_BITS <= 15
          /* NOTE: can cause a loss in precision if very high amplitude
             sound */
-        if (v > 32767)
-            v = 32767;
-        else if (v < -32768)
-            v = -32768;
+        v = av_clip_int16(v);
  #endif
          synth_buf[j] = v;
      }
@@ -848,9 +916,9 @@ void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
  
      sum = *dither_state;
      p = synth_buf + 16;
-    SUM8(sum, +=, w, p);
+    SUM8(MACS, sum, w, p);
      p = synth_buf + 48;
-    SUM8(sum, -=, w + 32, p);
+    SUM8(MLSS, sum, w + 32, p);
      *samples = round_sample(&sum);
      samples += incr;
      w++;
@@ -860,9 +928,9 @@ void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
      for(j=1;j<16;j++) {
          sum2 = 0;
          p = synth_buf + 16 + j;
-        SUM8P2(sum, +=, sum2, -=, w, w2, p);
+        SUM8P2(sum, MACS, sum2, MLSS, w, w2, p);
          p = synth_buf + 48 - j;
-        SUM8P2(sum, -=, sum2, -=, w + 32, w2 + 32, p);
+        SUM8P2(sum, MLSS, sum2, MLSS, w + 32, w2 + 32, p);
  
          *samples = round_sample(&sum);
          samples += incr;
@@ -874,7 +942,7 @@ void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
      }
  
      p = synth_buf + 32;
-    SUM8(sum, -=, w + 32, p);
+    SUM8(MLSS, sum, w + 32, p);
      *samples = round_sample(&sum);
      *dither_state= sum;
  
@@ -1536,7 +1604,7 @@ static int huffman_decode(MPADecodeContext *s, GranuleDef *g,
                     part. We must go back into the data */
                  s_index -= 4;
                  skip_bits_long(&s->gb, last_pos - pos);
-                av_log(NULL, AV_LOG_INFO, "overread, skip %d enddists: %d %d\n", last_pos - pos, end_pos-pos, end_pos2-pos);
+                av_log(s->avctx, AV_LOG_INFO, "overread, skip %d enddists: %d %d\n", last_pos - pos, end_pos-pos, end_pos2-pos);
                  if(s->error_resilience >= FF_ER_COMPLIANT)
                      s_index=0;
                  break;
@@ -1572,10 +1640,10 @@ static int huffman_decode(MPADecodeContext *s, GranuleDef *g,
      bits_left = end_pos2 - get_bits_count(&s->gb);
  //av_log(NULL, AV_LOG_ERROR, "left:%d buf:%p\n", bits_left, s->in_gb.buffer);
      if (bits_left < 0/* || bits_left > 500*/) {
-        av_log(NULL, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
+        av_log(s->avctx, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
          s_index=0;
      }else if(bits_left > 0 && s->error_resilience >= FF_ER_AGGRESSIVE){
-        av_log(NULL, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
+        av_log(s->avctx, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
          s_index=0;
      }
      memset(&g->sb_hybrid[s_index], 0, sizeof(*g->sb_hybrid)*(576 - s_index));
@@ -2012,32 +2080,21 @@ static int mp_decode_layer3(MPADecodeContext *s)
                  g->scalefac_compress = get_bits(&s->gb, 9);
              else
                  g->scalefac_compress = get_bits(&s->gb, 4);
-            blocksplit_flag = get_bits(&s->gb, 1);
+            blocksplit_flag = get_bits1(&s->gb);
              if (blocksplit_flag) {
                  g->block_type = get_bits(&s->gb, 2);
                  if (g->block_type == 0){
-                    av_log(NULL, AV_LOG_ERROR, "invalid block type\n");
+                    av_log(s->avctx, AV_LOG_ERROR, "invalid block type\n");
                      return -1;
                  }
-                g->switch_point = get_bits(&s->gb, 1);
+                g->switch_point = get_bits1(&s->gb);
                  for(i=0;i<2;i++)
                      g->table_select[i] = get_bits(&s->gb, 5);
                  for(i=0;i<3;i++)
                      g->subblock_gain[i] = get_bits(&s->gb, 3);
-                /* compute huffman coded region sizes */
-                if (g->block_type == 2)
-                    g->region_size[0] = (36 / 2);
-                else {
-                    if (s->sample_rate_index <= 2)
-                        g->region_size[0] = (36 / 2);
-                    else if (s->sample_rate_index != 8)
-                        g->region_size[0] = (54 / 2);
-                    else
-                        g->region_size[0] = (108 / 2);
-                }
-                g->region_size[1] = (576 / 2);
+                ff_init_short_region(s, g);
              } else {
-                int region_address1, region_address2, l;
+                int region_address1, region_address2;
                  g->block_type = 0;
                  g->switch_point = 0;
                  for(i=0;i<3;i++)
@@ -2047,53 +2104,16 @@ static int mp_decode_layer3(MPADecodeContext *s)
                  region_address2 = get_bits(&s->gb, 3);
                  dprintf(s->avctx, "region1=%d region2=%d\n",
                          region_address1, region_address2);
-                g->region_size[0] =
-                    band_index_long[s->sample_rate_index][region_address1 + 1] >> 1;
-                l = region_address1 + region_address2 + 2;
-                /* should not overflow */
-                if (l > 22)
-                    l = 22;
-                g->region_size[1] =
-                    band_index_long[s->sample_rate_index][l] >> 1;
-            }
-            /* convert region offsets to region sizes and truncate
-               size to big_values */
-            g->region_size[2] = (576 / 2);
-            j = 0;
-            for(i=0;i<3;i++) {
-                k = FFMIN(g->region_size[i], g->big_values);
-                g->region_size[i] = k - j;
-                j = k;
-            }
-
-            /* compute band indexes */
-            if (g->block_type == 2) {
-                if (g->switch_point) {
-                    /* if switched mode, we handle the 36 first samples as
-                       long blocks.  For 8000Hz, we handle the 48 first
-                       exponents as long blocks (XXX: check this!) */
-                    if (s->sample_rate_index <= 2)
-                        g->long_end = 8;
-                    else if (s->sample_rate_index != 8)
-                        g->long_end = 6;
-                    else
-                        g->long_end = 4; /* 8000 Hz */
-
-                    g->short_start = 2 + (s->sample_rate_index != 8);
-                } else {
-                    g->long_end = 0;
-                    g->short_start = 0;
-                }
-            } else {
-                g->short_start = 13;
-                g->long_end = 22;
+                ff_init_long_region(s, g, region_address1, region_address2);
              }
+            ff_region_offset2size(g);
+            ff_compute_band_indexes(s, g);
  
              g->preflag = 0;
              if (!s->lsf)
-                g->preflag = get_bits(&s->gb, 1);
-            g->scalefac_scale = get_bits(&s->gb, 1);
-            g->count1table_select = get_bits(&s->gb, 1);
+                g->preflag = get_bits1(&s->gb);
+            g->scalefac_scale = get_bits1(&s->gb);
+            g->count1table_select = get_bits1(&s->gb);
              dprintf(s->avctx, "block_type=%d switch_point=%d\n",
                      g->block_type, g->switch_point);
          }
@@ -2116,7 +2136,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
          for(ch=0;ch<s->nb_channels;ch++) {
              g = &granules[ch][gr];
              if(get_bits_count(&s->gb)<0){
-                av_log(NULL, AV_LOG_ERROR, "mdb:%d, lastbuf:%d skipping granule %d\n",
+                av_log(s->avctx, AV_LOG_ERROR, "mdb:%d, lastbuf:%d skipping granule %d\n",
                                              main_data_begin, s->last_buf_size, gr);
                  skip_bits_long(&s->gb, g->part2_3_length);
                  memset(g->sb_hybrid, 0, sizeof(g->sb_hybrid));
@@ -2298,17 +2318,20 @@ static int mp_decode_frame(MPADecodeContext *s,
  
      /* skip error protection field */
      if (s->error_protection)
-        get_bits(&s->gb, 16);
+        skip_bits(&s->gb, 16);
  
      dprintf(s->avctx, "frame %d:\n", s->frame_count);
      switch(s->layer) {
      case 1:
+        s->avctx->frame_size = 384;
          nb_frames = mp_decode_layer1(s);
          break;
      case 2:
+        s->avctx->frame_size = 1152;
          nb_frames = mp_decode_layer2(s);
          break;
      case 3:
+        s->avctx->frame_size = s->lsf ? 576 : 1152;
      default:
          nb_frames = mp_decode_layer3(s);
  
@@ -2320,7 +2343,7 @@ static int mp_decode_frame(MPADecodeContext *s,
                  memmove(s->last_buf, s->gb.buffer + (get_bits_count(&s->gb)>>3), i);
                  s->last_buf_size=i;
              }else
-                av_log(NULL, AV_LOG_ERROR, "invalid old backstep %d\n", i);
+                av_log(s->avctx, AV_LOG_ERROR, "invalid old backstep %d\n", i);
              s->gb= s->in_gb;
              s->in_gb.buffer= NULL;
          }
@@ -2330,7 +2353,7 @@ static int mp_decode_frame(MPADecodeContext *s,
          i= (s->gb.size_in_bits - get_bits_count(&s->gb))>>3;
  
          if(i<0 || i > BACKSTEP_SIZE || nb_frames<0){
-            av_log(NULL, AV_LOG_ERROR, "invalid new backstep %d\n", i);
+            av_log(s->avctx, AV_LOG_WARNING, "invalid new backstep %d\n", i);
              i= FFMIN(BACKSTEP_SIZE, buf_size - HEADER_SIZE);
          }
          assert(i <= buf_size - HEADER_SIZE && i>= 0);
@@ -2369,7 +2392,7 @@ static int mp_decode_frame(MPADecodeContext *s,
  
  static int decode_frame(AVCodecContext * avctx,
                          void *data, int *data_size,
-                        uint8_t * buf, int buf_size)
+                        const uint8_t * buf, int buf_size)
  {
      MPADecodeContext *s = avctx->priv_data;
      uint32_t header;
@@ -2380,7 +2403,7 @@ retry:
      if(buf_size < HEADER_SIZE)
          return -1;
  
-    header = (buf[0] << 24) | (buf[1] << 16) | (buf[2] << 8) | buf[3];
+    header = AV_RB32(buf);
      if(ff_mpa_check_header(header) < 0){
          buf++;
  //        buf_size--;
@@ -2397,26 +2420,13 @@ retry:
      avctx->channels = s->nb_channels;
      avctx->bit_rate = s->bit_rate;
      avctx->sub_id = s->layer;
-    switch(s->layer) {
-    case 1:
-        avctx->frame_size = 384;
-        break;
-    case 2:
-        avctx->frame_size = 1152;
-        break;
-    case 3:
-        if (s->lsf)
-            avctx->frame_size = 576;
-        else
-            avctx->frame_size = 1152;
-        break;
-    }
  
      if(s->frame_size<=0 || s->frame_size > buf_size){
          av_log(avctx, AV_LOG_ERROR, "incomplete frame\n");
          return -1;
      }else if(s->frame_size < buf_size){
          av_log(avctx, AV_LOG_ERROR, "incorrect frame size\n");
+        buf_size= s->frame_size;
      }
  
      out_size = mp_decode_frame(s, out_samples, buf, buf_size);
@@ -2432,13 +2442,14 @@ retry:
  
  static void flush(AVCodecContext *avctx){
      MPADecodeContext *s = avctx->priv_data;
+    memset(s->synth_buf, 0, sizeof(s->synth_buf));
      s->last_buf_size= 0;
  }
  
  #ifdef CONFIG_MP3ADU_DECODER
  static int decode_frame_adu(AVCodecContext * avctx,
                          void *data, int *data_size,
-                        uint8_t * buf, int buf_size)
+                        const uint8_t * buf, int buf_size)
  {
      MPADecodeContext *s = avctx->priv_data;
      uint32_t header;
@@ -2458,7 +2469,7 @@ static int decode_frame_adu(AVCodecContext * avctx,
          len = MPA_MAX_CODED_FRAME_SIZE;
  
      // Get header and restore sync word
-    header = (buf[0] << 24) | (buf[1] << 16) | (buf[2] << 8) | buf[3] | 0xffe00000;
+    header = AV_RB32(buf) | 0xffe00000;
  
      if (ff_mpa_check_header(header) < 0) { // Bad header, discard frame
          *data_size = 0;
@@ -2472,7 +2483,7 @@ static int decode_frame_adu(AVCodecContext * avctx,
      avctx->bit_rate = s->bit_rate;
      avctx->sub_id = s->layer;
  
-    avctx->frame_size=s->frame_size = len;
+    s->frame_size = len;
  
      if (avctx->parse_only) {
          out_size = buf_size;
@@ -2486,11 +2497,23 @@ static int decode_frame_adu(AVCodecContext * avctx,
  #endif /* CONFIG_MP3ADU_DECODER */
  
  #ifdef CONFIG_MP3ON4_DECODER
+
+/**
+ * Context for MP3On4 decoder
+ */
+typedef struct MP3On4DecodeContext {
+    int frames;   ///< number of mp3 frames per block (number of mp3 decoder instances)
+    int syncword; ///< syncword patch
+    const uint8_t *coff; ///< channels offsets in output buffer
+    MPADecodeContext *mp3decctx[5]; ///< MPADecodeContext for every decoder instance
+} MP3On4DecodeContext;
+
+#include "mpeg4audio.h"
+
  /* Next 3 arrays are indexed by channel config number (passed via codecdata) */
-static int mp3Frames[16] = {0,1,1,2,3,3,4,5,2};   /* number of mp3 decoder instances */
-static int mp3Channels[16] = {0,1,2,3,4,5,6,8,4}; /* total output channels */
+static const uint8_t mp3Frames[8] = {0,1,1,2,3,3,4,5};   /* number of mp3 decoder instances */
  /* offsets into output buffer, assume output order is FL FR BL BR C LFE */
-static int chan_offset[9][5] = {
+static const uint8_t chan_offset[8][5] = {
      {0},
      {0},            // C
      {0},            // FLR
@@ -2499,13 +2522,13 @@ static int chan_offset[9][5] = {
      {4,0,2},        // C FLR BLRS
      {4,0,2,5},      // C FLR BLRS LFE
      {4,0,2,6,5},    // C FLR BLRS BLR LFE
-    {0,2}           // FLR BLRS
  };
  
  
  static int decode_init_mp3on4(AVCodecContext * avctx)
  {
      MP3On4DecodeContext *s = avctx->priv_data;
+    MPEG4AudioConfig cfg;
      int i;
  
      if ((avctx->extradata_size < 2) || (avctx->extradata == NULL)) {
@@ -2513,18 +2536,24 @@ static int decode_init_mp3on4(AVCodecContext * avctx)
          return -1;
      }
  
-    s->chan_cfg = (((unsigned char *)avctx->extradata)[1] >> 3) & 0x0f;
-    s->frames = mp3Frames[s->chan_cfg];
-    if(!s->frames) {
+    ff_mpeg4audio_get_config(&cfg, avctx->extradata, avctx->extradata_size);
+    if (!cfg.chan_config || cfg.chan_config > 7) {
          av_log(avctx, AV_LOG_ERROR, "Invalid channel config number.\n");
          return -1;
      }
-    avctx->channels = mp3Channels[s->chan_cfg];
+    s->frames = mp3Frames[cfg.chan_config];
+    s->coff = chan_offset[cfg.chan_config];
+    avctx->channels = ff_mpeg4audio_channels[cfg.chan_config];
+
+    if (cfg.sample_rate < 16000)
+        s->syncword = 0xffe00000;
+    else
+        s->syncword = 0xfff00000;
  
      /* Init the first mp3 decoder in standard way, so that all tables get builded
       * We replace avctx->priv_data with the context of the first decoder so that
       * decode_init() does not have to be changed.
-     * Other decoders will be inited here copying data from the first context
+     * Other decoders will be initialized here copying data from the first context
       */
      // Allocate zeroed memory for the first decoder context
      s->mp3decctx[0] = av_mallocz(sizeof(MPADecodeContext));
@@ -2564,81 +2593,65 @@ static int decode_close_mp3on4(AVCodecContext * avctx)
  
  static int decode_frame_mp3on4(AVCodecContext * avctx,
                          void *data, int *data_size,
-                        uint8_t * buf, int buf_size)
+                        const uint8_t * buf, int buf_size)
  {
      MP3On4DecodeContext *s = avctx->priv_data;
      MPADecodeContext *m;
-    int len, out_size = 0;
+    int fsize, len = buf_size, out_size = 0;
      uint32_t header;
      OUT_INT *out_samples = data;
      OUT_INT decoded_buf[MPA_FRAME_SIZE * MPA_MAX_CHANNELS];
      OUT_INT *outptr, *bp;
-    int fsize;
-    unsigned char *start2 = buf, *start;
-    int fr, i, j, n;
-    int off = avctx->channels;
-    int *coff = chan_offset[s->chan_cfg];
-
-    len = buf_size;
+    int fr, j, n;
  
+    *data_size = 0;
      // Discard too short frames
-    if (buf_size < HEADER_SIZE) {
-        *data_size = 0;
-        return buf_size;
-    }
+    if (buf_size < HEADER_SIZE)
+        return -1;
  
      // If only one decoder interleave is not needed
      outptr = s->frames == 1 ? out_samples : decoded_buf;
  
+    avctx->bit_rate = 0;
+
      for (fr = 0; fr < s->frames; fr++) {
-        start = start2;
-        fsize = (start[0] << 4) | (start[1] >> 4);
-        start2 += fsize;
-        if (fsize > len)
-            fsize = len;
-        len -= fsize;
-        if (fsize > MPA_MAX_CODED_FRAME_SIZE)
-            fsize = MPA_MAX_CODED_FRAME_SIZE;
+        fsize = AV_RB16(buf) >> 4;
+        fsize = FFMIN3(fsize, len, MPA_MAX_CODED_FRAME_SIZE);
          m = s->mp3decctx[fr];
          assert (m != NULL);
  
-        // Get header
-        header = (start[0] << 24) | (start[1] << 16) | (start[2] << 8) | start[3] | 0xfff00000;
+        header = (AV_RB32(buf) & 0x000fffff) | s->syncword; // patch header
  
-        if (ff_mpa_check_header(header) < 0) { // Bad header, discard block
-            *data_size = 0;
-            return buf_size;
-        }
+        if (ff_mpa_check_header(header) < 0) // Bad header, discard block
+            break;
  
          ff_mpegaudio_decode_header(m, header);
-        mp_decode_frame(m, decoded_buf, start, fsize);
+        out_size += mp_decode_frame(m, outptr, buf, fsize);
+        buf += fsize;
+        len -= fsize;
  
-        n = MPA_FRAME_SIZE * m->nb_channels;
-        out_size += n * sizeof(OUT_INT);
          if(s->frames > 1) {
+            n = m->avctx->frame_size*m->nb_channels;
              /* interleave output data */
-            bp = out_samples + coff[fr];
+            bp = out_samples + s->coff[fr];
              if(m->nb_channels == 1) {
                  for(j = 0; j < n; j++) {
                      *bp = decoded_buf[j];
-                    bp += off;
+                    bp += avctx->channels;
                  }
              } else {
                  for(j = 0; j < n; j++) {
                      bp[0] = decoded_buf[j++];
                      bp[1] = decoded_buf[j];
-                    bp += off;
+                    bp += avctx->channels;
                  }
              }
          }
+        avctx->bit_rate += m->bit_rate;
      }
  
      /* update codec info */
      avctx->sample_rate = s->mp3decctx[0]->sample_rate;
-    avctx->frame_size= buf_size;
-    avctx->bit_rate = 0;
-    for (i = 0; i < s->frames; i++)
-        avctx->bit_rate += s->mp3decctx[i]->bit_rate;
  
      *data_size = out_size;
      return buf_size;
@@ -2657,6 +2670,8 @@ AVCodec mp2_decoder =
      NULL,
      decode_frame,
      CODEC_CAP_PARSE_ONLY,
+    .flush= flush,
+    .long_name= NULL_IF_CONFIG_SMALL("MP2 (MPEG audio layer 2)"),
  };
  #endif
  #ifdef CONFIG_MP3_DECODER
@@ -2672,6 +2687,7 @@ AVCodec mp3_decoder =
      decode_frame,
      CODEC_CAP_PARSE_ONLY,
      .flush= flush,
+    .long_name= NULL_IF_CONFIG_SMALL("MP3 (MPEG audio layer 3)"),
  };
  #endif
  #ifdef CONFIG_MP3ADU_DECODER
@@ -2687,6 +2703,7 @@ AVCodec mp3adu_decoder =
      decode_frame_adu,
      CODEC_CAP_PARSE_ONLY,
      .flush= flush,
+    .long_name= NULL_IF_CONFIG_SMALL("ADU (Application Data Unit) MP3 (MPEG audio layer 3)"),
  };
  #endif
  #ifdef CONFIG_MP3ON4_DECODER
@@ -2701,5 +2718,6 @@ AVCodec mp3on4_decoder =
      decode_close_mp3on4,
      decode_frame_mp3on4,
      .flush= flush,
+    .long_name= NULL_IF_CONFIG_SMALL("MP3onMP4"),
  };
  #endif