suggest to use av_get_bytes_per_sample() in av_get_bits_per_sample_format() doxy

[ffmpeg] / libavcodec / mpegaudiodec.c
diff --git a/libavcodec/mpegaudiodec.c b/libavcodec/mpegaudiodec.c

index e5a1acecb03d87e7a290a66cef5dcb71be684065..033d76e049e7e76153a6b80b8f0ea72c8a9a8d28 100644 (file)
--- a/libavcodec/mpegaudiodec.c
+++ b/libavcodec/mpegaudiodec.c
@@ -2,20 +2,20 @@
   * MPEG Audio decoder
   * Copyright (c) 2001, 2002 Fabrice Bellard
   *
- * This file is part of FFmpeg.
+ * This file is part of Libav.
   *
- * FFmpeg is free software; you can redistribute it and/or
+ * Libav is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
- * FFmpeg is distributed in the hope that it will be useful,
+ * Libav is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
+ * License along with Libav; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
@@ -24,40 +24,85 @@
   * MPEG Audio decoder.
   */
  
+#include "libavutil/audioconvert.h"
  #include "avcodec.h"
  #include "get_bits.h"
-#include "dsputil.h"
+#include "mathops.h"
+#include "mpegaudiodsp.h"
  
  /*
   * TODO:
- *  - in low precision mode, use more 16 bit multiplies in synth filter
   *  - test lsf / mpeg25 extensively.
   */
  
  #include "mpegaudio.h"
  #include "mpegaudiodecheader.h"
  
-#include "mathops.h"
+#define BACKSTEP_SIZE 512
+#define EXTRABYTES 24
+
+/* layer 3 "granule" */
+typedef struct GranuleDef {
+    uint8_t scfsi;
+    int part2_3_length;
+    int big_values;
+    int global_gain;
+    int scalefac_compress;
+    uint8_t block_type;
+    uint8_t switch_point;
+    int table_select[3];
+    int subblock_gain[3];
+    uint8_t scalefac_scale;
+    uint8_t count1table_select;
+    int region_size[3]; /* number of huffman codes in each region */
+    int preflag;
+    int short_start, long_end; /* long/short band indexes */
+    uint8_t scale_factors[40];
+    INTFLOAT sb_hybrid[SBLIMIT * 18]; /* 576 samples */
+} GranuleDef;
+
+typedef struct MPADecodeContext {
+    MPA_DECODE_HEADER
+    uint8_t last_buf[2*BACKSTEP_SIZE + EXTRABYTES];
+    int last_buf_size;
+    /* next header (used in free format parsing) */
+    uint32_t free_format_next_header;
+    GetBitContext gb;
+    GetBitContext in_gb;
+    DECLARE_ALIGNED(32, MPA_INT, synth_buf)[MPA_MAX_CHANNELS][512 * 2];
+    int synth_buf_offset[MPA_MAX_CHANNELS];
+    DECLARE_ALIGNED(32, INTFLOAT, sb_samples)[MPA_MAX_CHANNELS][36][SBLIMIT];
+    INTFLOAT mdct_buf[MPA_MAX_CHANNELS][SBLIMIT * 18]; /* previous samples, for layer 3 MDCT */
+    GranuleDef granules[2][2]; /* Used in Layer 3 */
+#ifdef DEBUG
+    int frame_count;
+#endif
+    int adu_mode; ///< 0 for standard mp3, 1 for adu formatted mp3
+    int dither_state;
+    int error_recognition;
+    AVCodecContext* avctx;
+    MPADSPContext mpadsp;
+} MPADecodeContext;
  
  #if CONFIG_FLOAT
  #   define SHR(a,b)       ((a)*(1.0f/(1<<(b))))
-#   define compute_antialias compute_antialias_float
  #   define FIXR_OLD(a)    ((int)((a) * FRAC_ONE + 0.5))
  #   define FIXR(x)        ((float)(x))
  #   define FIXHR(x)       ((float)(x))
  #   define MULH3(x, y, s) ((s)*(y)*(x))
  #   define MULLx(x, y, s) ((y)*(x))
  #   define RENAME(a) a ## _float
+#   define OUT_FMT AV_SAMPLE_FMT_FLT
  #else
  #   define SHR(a,b)       ((a)>>(b))
-#   define compute_antialias compute_antialias_integer
  /* WARNING: only correct for posititive numbers */
  #   define FIXR_OLD(a)    ((int)((a) * FRAC_ONE + 0.5))
  #   define FIXR(a)        ((int)((a) * FRAC_ONE + 0.5))
  #   define FIXHR(a)       ((int)((a) * (1LL<<32) + 0.5))
  #   define MULH3(x, y, s) MULH((s)*(x), y)
  #   define MULLx(x, y, s) MULL(x,y,s)
-#   define RENAME(a)      a
+#   define RENAME(a)      a ## _fixed
+#   define OUT_FMT AV_SAMPLE_FMT_S16
  #endif
  
  /****************/
@@ -67,17 +112,6 @@
  #include "mpegaudiodata.h"
  #include "mpegaudiodectab.h"
  
-#if CONFIG_FLOAT
-#    include "fft.h"
-#else
-#    include "dct32.c"
-#endif
-
-static void compute_antialias_integer(MPADecodeContext *s, GranuleDef *g);
-static void compute_antialias_float(MPADecodeContext *s, GranuleDef *g);
-static void apply_window_mp3_c(MPA_INT *synth_buf, MPA_INT *window,
-                               int *dither_state, OUT_INT *samples, int incr);
-
  /* vlc structure for decoding layer 3 huffman tables */
  static VLC huff_vlc[16];
  static VLC_TYPE huff_vlc_tables[
@@ -99,8 +133,7 @@ static uint16_t band_index_long[9][23];
  /* intensity stereo coef table */
  static INTFLOAT is_table[2][16];
  static INTFLOAT is_table_lsf[2][2][16];
-static int32_t csa_table[8][4];
-static float csa_table_float[8][4];
+static INTFLOAT csa_table[8][4];
  static INTFLOAT mdct_win[8][36];
  
  static int16_t division_tab3[1<<6 ];
@@ -126,8 +159,6 @@ static const int32_t scale_factor_mult2[3][3] = {
      SCALE_GEN(4.0 / 9.0), /* 9 steps */
  };
  
-DECLARE_ALIGNED(16, MPA_INT, RENAME(ff_mpa_synth_window))[512+256];
-
  /**
   * Convert region offsets to region sizes and truncate
   * size to big_values.
@@ -238,82 +269,6 @@ static inline int l3_unscale(int value, int exponent)
      return m;
  }
  
-/* all integer n^(4/3) computation code */
-#define DEV_ORDER 13
-
-#define POW_FRAC_BITS 24
-#define POW_FRAC_ONE    (1 << POW_FRAC_BITS)
-#define POW_FIX(a)   ((int)((a) * POW_FRAC_ONE))
-#define POW_MULL(a,b) (((int64_t)(a) * (int64_t)(b)) >> POW_FRAC_BITS)
-
-static int dev_4_3_coefs[DEV_ORDER];
-
-#if 0 /* unused */
-static int pow_mult3[3] = {
-    POW_FIX(1.0),
-    POW_FIX(1.25992104989487316476),
-    POW_FIX(1.58740105196819947474),
-};
-#endif
-
-static av_cold void int_pow_init(void)
-{
-    int i, a;
-
-    a = POW_FIX(1.0);
-    for(i=0;i<DEV_ORDER;i++) {
-        a = POW_MULL(a, POW_FIX(4.0 / 3.0) - i * POW_FIX(1.0)) / (i + 1);
-        dev_4_3_coefs[i] = a;
-    }
-}
-
-#if 0 /* unused, remove? */
-/* return the mantissa and the binary exponent */
-static int int_pow(int i, int *exp_ptr)
-{
-    int e, er, eq, j;
-    int a, a1;
-
-    /* renormalize */
-    a = i;
-    e = POW_FRAC_BITS;
-    while (a < (1 << (POW_FRAC_BITS - 1))) {
-        a = a << 1;
-        e--;
-    }
-    a -= (1 << POW_FRAC_BITS);
-    a1 = 0;
-    for(j = DEV_ORDER - 1; j >= 0; j--)
-        a1 = POW_MULL(a, dev_4_3_coefs[j] + a1);
-    a = (1 << POW_FRAC_BITS) + a1;
-    /* exponent compute (exact) */
-    e = e * 4;
-    er = e % 3;
-    eq = e / 3;
-    a = POW_MULL(a, pow_mult3[er]);
-    while (a >= 2 * POW_FRAC_ONE) {
-        a = a >> 1;
-        eq++;
-    }
-    /* convert to float */
-    while (a < POW_FRAC_ONE) {
-        a = a << 1;
-        eq--;
-    }
-    /* now POW_FRAC_ONE <= a < 2 * POW_FRAC_ONE */
-#if POW_FRAC_BITS > FRAC_BITS
-    a = (a + (1 << (POW_FRAC_BITS - FRAC_BITS - 1))) >> (POW_FRAC_BITS - FRAC_BITS);
-    /* correct overflow */
-    if (a >= 2 * (1 << FRAC_BITS)) {
-        a = a >> 1;
-        eq++;
-    }
-#endif
-    *exp_ptr = eq;
-    return a;
-}
-#endif
-
  static av_cold int decode_init(AVCodecContext * avctx)
  {
      MPADecodeContext *s = avctx->priv_data;
@@ -321,11 +276,8 @@ static av_cold int decode_init(AVCodecContext * avctx)
      int i, j, k;
  
      s->avctx = avctx;
-    s->apply_window_mp3 = apply_window_mp3_c;
-#if HAVE_MMX && CONFIG_FLOAT
-    ff_mpegaudiodec_init_mmx(s);
-#endif
-    if (HAVE_ALTIVEC && CONFIG_FLOAT) ff_mpegaudiodec_init_altivec(s);
+
+    ff_mpadsp_init(&s->mpadsp);
  
      avctx->sample_fmt= OUT_FMT;
      s->error_recognition= avctx->error_recognition;
@@ -350,16 +302,13 @@ static av_cold int decode_init(AVCodecContext * avctx)
              scale_factor_mult[i][0] = MULLx(norm, FIXR(1.0          * 2.0), FRAC_BITS);
              scale_factor_mult[i][1] = MULLx(norm, FIXR(0.7937005259 * 2.0), FRAC_BITS);
              scale_factor_mult[i][2] = MULLx(norm, FIXR(0.6299605249 * 2.0), FRAC_BITS);
-            dprintf(avctx, "%d: norm=%x s=%x %x %x\n",
+            av_dlog(avctx, "%d: norm=%x s=%x %x %x\n",
                      i, norm,
                      scale_factor_mult[i][0],
                      scale_factor_mult[i][1],
                      scale_factor_mult[i][2]);
          }
  
-#if CONFIG_FLOAT
-        ff_dct_init(&s->dct, 5, DCT_II);
-#endif
          RENAME(ff_mpa_synth_init)(RENAME(ff_mpa_synth_window));
  
          /* huffman decode tables */
@@ -415,7 +364,6 @@ static av_cold int decode_init(AVCodecContext * avctx)
  
          /* compute n ^ (4/3) and store it in mantissa/exp format */
  
-        int_pow_init();
          mpegaudio_tableinit();
  
          for (i = 0; i < 4; i++)
@@ -458,8 +406,9 @@ static av_cold int decode_init(AVCodecContext * avctx)
                  k = i & 1;
                  is_table_lsf[j][k ^ 1][i] = FIXR(f);
                  is_table_lsf[j][k][i] = FIXR(1.0);
-                dprintf(avctx, "is_table_lsf %d %d: %x %x\n",
-                        i, j, is_table_lsf[j][0][i], is_table_lsf[j][1][i]);
+                av_dlog(avctx, "is_table_lsf %d %d: %f %f\n",
+                        i, j, (float) is_table_lsf[j][0][i],
+                        (float) is_table_lsf[j][1][i]);
              }
          }
  
@@ -468,14 +417,17 @@ static av_cold int decode_init(AVCodecContext * avctx)
              ci = ci_table[i];
              cs = 1.0 / sqrt(1.0 + ci * ci);
              ca = cs * ci;
+#if !CONFIG_FLOAT
              csa_table[i][0] = FIXHR(cs/4);
              csa_table[i][1] = FIXHR(ca/4);
              csa_table[i][2] = FIXHR(ca/4) + FIXHR(cs/4);
              csa_table[i][3] = FIXHR(ca/4) - FIXHR(cs/4);
-            csa_table_float[i][0] = cs;
-            csa_table_float[i][1] = ca;
-            csa_table_float[i][2] = ca + cs;
-            csa_table_float[i][3] = ca - cs;
+#else
+            csa_table[i][0] = cs;
+            csa_table[i][1] = ca;
+            csa_table[i][2] = ca + cs;
+            csa_table[i][3] = ca - cs;
+#endif
          }
  
          /* compute mdct windows */
@@ -523,219 +475,6 @@ static av_cold int decode_init(AVCodecContext * avctx)
      return 0;
  }
  
-
-#if CONFIG_FLOAT
-static inline float round_sample(float *sum)
-{
-    float sum1=*sum;
-    *sum = 0;
-    return sum1;
-}
-
-/* signed 16x16 -> 32 multiply add accumulate */
-#define MACS(rt, ra, rb) rt+=(ra)*(rb)
-
-/* signed 16x16 -> 32 multiply */
-#define MULS(ra, rb) ((ra)*(rb))
-
-#define MLSS(rt, ra, rb) rt-=(ra)*(rb)
-
-#elif FRAC_BITS <= 15
-
-static inline int round_sample(int *sum)
-{
-    int sum1;
-    sum1 = (*sum) >> OUT_SHIFT;
-    *sum &= (1<<OUT_SHIFT)-1;
-    return av_clip(sum1, OUT_MIN, OUT_MAX);
-}
-
-/* signed 16x16 -> 32 multiply add accumulate */
-#define MACS(rt, ra, rb) MAC16(rt, ra, rb)
-
-/* signed 16x16 -> 32 multiply */
-#define MULS(ra, rb) MUL16(ra, rb)
-
-#define MLSS(rt, ra, rb) MLS16(rt, ra, rb)
-
-#else
-
-static inline int round_sample(int64_t *sum)
-{
-    int sum1;
-    sum1 = (int)((*sum) >> OUT_SHIFT);
-    *sum &= (1<<OUT_SHIFT)-1;
-    return av_clip(sum1, OUT_MIN, OUT_MAX);
-}
-
-#   define MULS(ra, rb) MUL64(ra, rb)
-#   define MACS(rt, ra, rb) MAC64(rt, ra, rb)
-#   define MLSS(rt, ra, rb) MLS64(rt, ra, rb)
-#endif
-
-#define SUM8(op, sum, w, p)               \
-{                                         \
-    op(sum, (w)[0 * 64], (p)[0 * 64]);    \
-    op(sum, (w)[1 * 64], (p)[1 * 64]);    \
-    op(sum, (w)[2 * 64], (p)[2 * 64]);    \
-    op(sum, (w)[3 * 64], (p)[3 * 64]);    \
-    op(sum, (w)[4 * 64], (p)[4 * 64]);    \
-    op(sum, (w)[5 * 64], (p)[5 * 64]);    \
-    op(sum, (w)[6 * 64], (p)[6 * 64]);    \
-    op(sum, (w)[7 * 64], (p)[7 * 64]);    \
-}
-
-#define SUM8P2(sum1, op1, sum2, op2, w1, w2, p) \
-{                                               \
-    INTFLOAT tmp;\
-    tmp = p[0 * 64];\
-    op1(sum1, (w1)[0 * 64], tmp);\
-    op2(sum2, (w2)[0 * 64], tmp);\
-    tmp = p[1 * 64];\
-    op1(sum1, (w1)[1 * 64], tmp);\
-    op2(sum2, (w2)[1 * 64], tmp);\
-    tmp = p[2 * 64];\
-    op1(sum1, (w1)[2 * 64], tmp);\
-    op2(sum2, (w2)[2 * 64], tmp);\
-    tmp = p[3 * 64];\
-    op1(sum1, (w1)[3 * 64], tmp);\
-    op2(sum2, (w2)[3 * 64], tmp);\
-    tmp = p[4 * 64];\
-    op1(sum1, (w1)[4 * 64], tmp);\
-    op2(sum2, (w2)[4 * 64], tmp);\
-    tmp = p[5 * 64];\
-    op1(sum1, (w1)[5 * 64], tmp);\
-    op2(sum2, (w2)[5 * 64], tmp);\
-    tmp = p[6 * 64];\
-    op1(sum1, (w1)[6 * 64], tmp);\
-    op2(sum2, (w2)[6 * 64], tmp);\
-    tmp = p[7 * 64];\
-    op1(sum1, (w1)[7 * 64], tmp);\
-    op2(sum2, (w2)[7 * 64], tmp);\
-}
-
-void av_cold RENAME(ff_mpa_synth_init)(MPA_INT *window)
-{
-    int i, j;
-
-    /* max = 18760, max sum over all 16 coefs : 44736 */
-    for(i=0;i<257;i++) {
-        INTFLOAT v;
-        v = ff_mpa_enwindow[i];
-#if CONFIG_FLOAT
-        v *= 1.0 / (1LL<<(16 + FRAC_BITS));
-#elif WFRAC_BITS < 16
-        v = (v + (1 << (16 - WFRAC_BITS - 1))) >> (16 - WFRAC_BITS);
-#endif
-        window[i] = v;
-        if ((i & 63) != 0)
-            v = -v;
-        if (i != 0)
-            window[512 - i] = v;
-    }
-
-    // Needed for avoiding shuffles in ASM implementations
-    for(i=0; i < 8; i++)
-        for(j=0; j < 16; j++)
-            window[512+16*i+j] = window[64*i+32-j];
-
-    for(i=0; i < 8; i++)
-        for(j=0; j < 16; j++)
-            window[512+128+16*i+j] = window[64*i+48-j];
-}
-
-static void apply_window_mp3_c(MPA_INT *synth_buf, MPA_INT *window,
-                               int *dither_state, OUT_INT *samples, int incr)
-{
-    register const MPA_INT *w, *w2, *p;
-    int j;
-    OUT_INT *samples2;
-#if CONFIG_FLOAT
-    float sum, sum2;
-#elif FRAC_BITS <= 15
-    int sum, sum2;
-#else
-    int64_t sum, sum2;
-#endif
-
-    /* copy to avoid wrap */
-    memcpy(synth_buf + 512, synth_buf, 32 * sizeof(*synth_buf));
-
-    samples2 = samples + 31 * incr;
-    w = window;
-    w2 = window + 31;
-
-    sum = *dither_state;
-    p = synth_buf + 16;
-    SUM8(MACS, sum, w, p);
-    p = synth_buf + 48;
-    SUM8(MLSS, sum, w + 32, p);
-    *samples = round_sample(&sum);
-    samples += incr;
-    w++;
-
-    /* we calculate two samples at the same time to avoid one memory
-       access per two sample */
-    for(j=1;j<16;j++) {
-        sum2 = 0;
-        p = synth_buf + 16 + j;
-        SUM8P2(sum, MACS, sum2, MLSS, w, w2, p);
-        p = synth_buf + 48 - j;
-        SUM8P2(sum, MLSS, sum2, MLSS, w + 32, w2 + 32, p);
-
-        *samples = round_sample(&sum);
-        samples += incr;
-        sum += sum2;
-        *samples2 = round_sample(&sum);
-        samples2 -= incr;
-        w++;
-        w2--;
-    }
-
-    p = synth_buf + 32;
-    SUM8(MLSS, sum, w + 32, p);
-    *samples = round_sample(&sum);
-    *dither_state= sum;
-}
-
-
-/* 32 sub band synthesis filter. Input: 32 sub band samples, Output:
-   32 samples. */
-/* XXX: optimize by avoiding ring buffer usage */
-#if !CONFIG_FLOAT
-void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
-                         MPA_INT *window, int *dither_state,
-                         OUT_INT *samples, int incr,
-                         INTFLOAT sb_samples[SBLIMIT])
-{
-    register MPA_INT *synth_buf;
-    int offset;
-#if FRAC_BITS <= 15
-    int32_t tmp[32];
-    int j;
-#endif
-
-    offset = *synth_buf_offset;
-    synth_buf = synth_buf_ptr + offset;
-
-#if FRAC_BITS <= 15
-    dct32(tmp, sb_samples);
-    for(j=0;j<32;j++) {
-        /* NOTE: can cause a loss in precision if very high amplitude
-           sound */
-        synth_buf[j] = av_clip_int16(tmp[j]);
-    }
-#else
-    dct32(synth_buf, sb_samples);
-#endif
-
-    apply_window_mp3_c(synth_buf, window, dither_state, samples, incr);
-
-    offset = (offset - 32) & 511;
-    *synth_buf_offset = offset;
-}
-#endif
-
  #define C3 FIXHR(0.86602540378443864676/2)
  
  /* 0.5 / cos(pi*(2*i+1)/36) */
@@ -987,7 +726,7 @@ static int mp_decode_layer2(MPADecodeContext *s)
      else
          bound = sblimit;
  
-    dprintf(s->avctx, "bound=%d sblimit=%d\n", bound, sblimit);
+    av_dlog(s->avctx, "bound=%d sblimit=%d\n", bound, sblimit);
  
      /* sanity check */
      if( bound > sblimit ) bound = sblimit;
@@ -1310,7 +1049,7 @@ static int huffman_decode(MPADecodeContext *s, GranuleDef *g,
  
              exponent= exponents[s_index];
  
-            dprintf(s->avctx, "region=%d n=%d x=%d y=%d exp=%d\n",
+            av_dlog(s->avctx, "region=%d n=%d x=%d y=%d exp=%d\n",
                      i, g->region_size[i] - j, x, y, exponent);
              if(y&16){
                  x = y >> 5;
@@ -1378,7 +1117,7 @@ static int huffman_decode(MPADecodeContext *s, GranuleDef *g,
          last_pos= pos;
  
          code = get_vlc2(&s->gb, vlc->table, vlc->bits, 1);
-        dprintf(s->avctx, "t=%d code=%d\n", g->count1table_select, code);
+        av_dlog(s->avctx, "t=%d code=%d\n", g->count1table_select, code);
          g->sb_hybrid[s_index+0]=
          g->sb_hybrid[s_index+1]=
          g->sb_hybrid[s_index+2]=
@@ -1575,50 +1314,26 @@ static void compute_stereo(MPADecodeContext *s,
      }
  }
  
-static void compute_antialias_integer(MPADecodeContext *s,
-                              GranuleDef *g)
-{
-    int32_t *ptr, *csa;
-    int n, i;
-
-    /* we antialias only "long" bands */
-    if (g->block_type == 2) {
-        if (!g->switch_point)
-            return;
-        /* XXX: check this for 8000Hz case */
-        n = 1;
-    } else {
-        n = SBLIMIT - 1;
-    }
-
-    ptr = g->sb_hybrid + 18;
-    for(i = n;i > 0;i--) {
-        int tmp0, tmp1, tmp2;
-        csa = &csa_table[0][0];
-#define INT_AA(j) \
-            tmp0 = ptr[-1-j];\
-            tmp1 = ptr[   j];\
-            tmp2= MULH(tmp0 + tmp1, csa[0+4*j]);\
-            ptr[-1-j] = 4*(tmp2 - MULH(tmp1, csa[2+4*j]));\
-            ptr[   j] = 4*(tmp2 + MULH(tmp0, csa[3+4*j]));
-
-        INT_AA(0)
-        INT_AA(1)
-        INT_AA(2)
-        INT_AA(3)
-        INT_AA(4)
-        INT_AA(5)
-        INT_AA(6)
-        INT_AA(7)
-
-        ptr += 18;
-    }
-}
+#if CONFIG_FLOAT
+#define AA(j) do {                                                      \
+        float tmp0 = ptr[-1-j];                                         \
+        float tmp1 = ptr[   j];                                         \
+        ptr[-1-j] = tmp0 * csa_table[j][0] - tmp1 * csa_table[j][1];    \
+        ptr[   j] = tmp0 * csa_table[j][1] + tmp1 * csa_table[j][0];    \
+    } while (0)
+#else
+#define AA(j) do {                                              \
+        int tmp0 = ptr[-1-j];                                   \
+        int tmp1 = ptr[   j];                                   \
+        int tmp2 = MULH(tmp0 + tmp1, csa_table[j][0]);          \
+        ptr[-1-j] = 4*(tmp2 - MULH(tmp1, csa_table[j][2]));     \
+        ptr[   j] = 4*(tmp2 + MULH(tmp0, csa_table[j][3]));     \
+    } while (0)
+#endif
  
-static void compute_antialias_float(MPADecodeContext *s,
-                              GranuleDef *g)
+static void compute_antialias(MPADecodeContext *s, GranuleDef *g)
  {
-    float *ptr;
+    INTFLOAT *ptr;
      int n, i;
  
      /* we antialias only "long" bands */
@@ -1633,22 +1348,14 @@ static void compute_antialias_float(MPADecodeContext *s,
  
      ptr = g->sb_hybrid + 18;
      for(i = n;i > 0;i--) {
-        float tmp0, tmp1;
-        float *csa = &csa_table_float[0][0];
-#define FLOAT_AA(j)\
-        tmp0= ptr[-1-j];\
-        tmp1= ptr[   j];\
-        ptr[-1-j] = tmp0 * csa[0+4*j] - tmp1 * csa[1+4*j];\
-        ptr[   j] = tmp0 * csa[1+4*j] + tmp1 * csa[0+4*j];
-
-        FLOAT_AA(0)
-        FLOAT_AA(1)
-        FLOAT_AA(2)
-        FLOAT_AA(3)
-        FLOAT_AA(4)
-        FLOAT_AA(5)
-        FLOAT_AA(6)
-        FLOAT_AA(7)
+        AA(0);
+        AA(1);
+        AA(2);
+        AA(3);
+        AA(4);
+        AA(5);
+        AA(6);
+        AA(7);
  
          ptr += 18;
      }
@@ -1748,7 +1455,7 @@ static void compute_imdct(MPADecodeContext *s,
  /* main layer3 decoding function */
  static int mp_decode_layer3(MPADecodeContext *s)
  {
-    int nb_granules, main_data_begin, private_bits;
+    int nb_granules, main_data_begin;
      int gr, ch, blocksplit_flag, i, j, k, n, bits_pos;
      GranuleDef *g;
      int16_t exponents[576]; //FIXME try INTFLOAT
@@ -1756,14 +1463,14 @@ static int mp_decode_layer3(MPADecodeContext *s)
      /* read side info */
      if (s->lsf) {
          main_data_begin = get_bits(&s->gb, 8);
-        private_bits = get_bits(&s->gb, s->nb_channels);
+        skip_bits(&s->gb, s->nb_channels);
          nb_granules = 1;
      } else {
          main_data_begin = get_bits(&s->gb, 9);
          if (s->nb_channels == 2)
-            private_bits = get_bits(&s->gb, 3);
+            skip_bits(&s->gb, 3);
          else
-            private_bits = get_bits(&s->gb, 5);
+            skip_bits(&s->gb, 5);
          nb_granules = 2;
          for(ch=0;ch<s->nb_channels;ch++) {
              s->granules[ch][0].scfsi = 0;/* all scale factors are transmitted */
@@ -1773,7 +1480,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
  
      for(gr=0;gr<nb_granules;gr++) {
          for(ch=0;ch<s->nb_channels;ch++) {
-            dprintf(s->avctx, "gr=%d ch=%d: side_info\n", gr, ch);
+            av_dlog(s->avctx, "gr=%d ch=%d: side_info\n", gr, ch);
              g = &s->granules[ch][gr];
              g->part2_3_length = get_bits(&s->gb, 12);
              g->big_values = get_bits(&s->gb, 9);
@@ -1814,7 +1521,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
                  /* compute huffman coded region sizes */
                  region_address1 = get_bits(&s->gb, 4);
                  region_address2 = get_bits(&s->gb, 3);
-                dprintf(s->avctx, "region1=%d region2=%d\n",
+                av_dlog(s->avctx, "region1=%d region2=%d\n",
                          region_address1, region_address2);
                  ff_init_long_region(s, g, region_address1, region_address2);
              }
@@ -1826,7 +1533,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
                  g->preflag = get_bits1(&s->gb);
              g->scalefac_scale = get_bits1(&s->gb);
              g->count1table_select = get_bits1(&s->gb);
-            dprintf(s->avctx, "block_type=%d switch_point=%d\n",
+            av_dlog(s->avctx, "block_type=%d switch_point=%d\n",
                      g->block_type, g->switch_point);
          }
      }
@@ -1835,7 +1542,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
      const uint8_t *ptr = s->gb.buffer + (get_bits_count(&s->gb)>>3);
      assert((get_bits_count(&s->gb) & 7) == 0);
      /* now we get bits from the main_data_begin offset */
-    dprintf(s->avctx, "seekback: %d\n", main_data_begin);
+    av_dlog(s->avctx, "seekback: %d\n", main_data_begin);
  //av_log(NULL, AV_LOG_ERROR, "backstep:%d, lastbuf:%d\n", main_data_begin, s->last_buf_size);
  
      memcpy(s->last_buf + s->last_buf_size, ptr, EXTRABYTES);
@@ -1869,7 +1576,7 @@ static int mp_decode_layer3(MPADecodeContext *s)
                  /* MPEG1 scale factors */
                  slen1 = slen_table[0][g->scalefac_compress];
                  slen2 = slen_table[1][g->scalefac_compress];
-                dprintf(s->avctx, "slen1=%d slen2=%d\n", slen1, slen2);
+                av_dlog(s->avctx, "slen1=%d slen2=%d\n", slen1, slen2);
                  if (g->block_type == 2) {
                      n = g->switch_point ? 17 : 18;
                      j = 0;
@@ -2002,7 +1709,7 @@ static int mp_decode_frame(MPADecodeContext *s,
      if (s->error_protection)
          skip_bits(&s->gb, 16);
  
-    dprintf(s->avctx, "frame %d:\n", s->frame_count);
+    av_dlog(s->avctx, "frame %d:\n", s->frame_count);
      switch(s->layer) {
      case 1:
          s->avctx->frame_size = 384;
@@ -2051,9 +1758,7 @@ static int mp_decode_frame(MPADecodeContext *s,
          samples_ptr = samples + ch;
          for(i=0;i<nb_frames;i++) {
              RENAME(ff_mpa_synth_filter)(
-#if CONFIG_FLOAT
-                         s,
-#endif
+                         &s->mpadsp,
                           s->synth_buf[ch], &(s->synth_buf_offset[ch]),
                           RENAME(ff_mpa_synth_window), &s->dither_state,
                           samples_ptr, s->nb_channels,
@@ -2092,7 +1797,9 @@ static int decode_frame(AVCodecContext * avctx,
      }
      /* update codec info */
      avctx->channels = s->nb_channels;
-    avctx->bit_rate = s->bit_rate;
+    avctx->channel_layout = s->nb_channels == 1 ? AV_CH_LAYOUT_MONO : AV_CH_LAYOUT_STEREO;
+    if (!avctx->bit_rate)
+        avctx->bit_rate = s->bit_rate;
      avctx->sub_id = s->layer;
  
      if(*data_size < 1152*avctx->channels*sizeof(OUT_INT))
@@ -2160,7 +1867,8 @@ static int decode_frame_adu(AVCodecContext * avctx,
      /* update codec info */
      avctx->sample_rate = s->sample_rate;
      avctx->channels = s->nb_channels;
-    avctx->bit_rate = s->bit_rate;
+    if (!avctx->bit_rate)
+        avctx->bit_rate = s->bit_rate;
      avctx->sub_id = s->layer;
  
      s->frame_size = len;
@@ -2263,8 +1971,7 @@ static av_cold int decode_close_mp3on4(AVCodecContext * avctx)
      int i;
  
      for (i = 0; i < s->frames; i++)
-        if (s->mp3decctx[i])
-            av_free(s->mp3decctx[i]);
+        av_free(s->mp3decctx[i]);
  
      return 0;
  }
@@ -2344,7 +2051,7 @@ static int decode_frame_mp3on4(AVCodecContext * avctx,
  
  #if !CONFIG_FLOAT
  #if CONFIG_MP1_DECODER
-AVCodec mp1_decoder =
+AVCodec ff_mp1_decoder =
  {
      "mp1",
      AVMEDIA_TYPE_AUDIO,
@@ -2360,7 +2067,7 @@ AVCodec mp1_decoder =
  };
  #endif
  #if CONFIG_MP2_DECODER
-AVCodec mp2_decoder =
+AVCodec ff_mp2_decoder =
  {
      "mp2",
      AVMEDIA_TYPE_AUDIO,
@@ -2376,7 +2083,7 @@ AVCodec mp2_decoder =
  };
  #endif
  #if CONFIG_MP3_DECODER
-AVCodec mp3_decoder =
+AVCodec ff_mp3_decoder =
  {
      "mp3",
      AVMEDIA_TYPE_AUDIO,
@@ -2392,7 +2099,7 @@ AVCodec mp3_decoder =
  };
  #endif
  #if CONFIG_MP3ADU_DECODER
-AVCodec mp3adu_decoder =
+AVCodec ff_mp3adu_decoder =
  {
      "mp3adu",
      AVMEDIA_TYPE_AUDIO,
@@ -2408,7 +2115,7 @@ AVCodec mp3adu_decoder =
  };
  #endif
  #if CONFIG_MP3ON4_DECODER
-AVCodec mp3on4_decoder =
+AVCodec ff_mp3on4_decoder =
  {
      "mp3on4",
      AVMEDIA_TYPE_AUDIO,