x86: Refactor PSWAPD fallback implementations and port to cpuflags

[ffmpeg] / libavcodec / amrnbdec.c
diff --git a/libavcodec/amrnbdec.c b/libavcodec/amrnbdec.c

index 616be9710e607cfb99860e7c3c2ab65c0d379274..21966456a0f12b98f11e1bd5582a427b05ea9db0 100644 (file)
--- a/libavcodec/amrnbdec.c
+++ b/libavcodec/amrnbdec.c
@@ -3,20 +3,20 @@
   * Copyright (c) 2006-2007 Robert Swain
   * Copyright (c) 2009 Colin McQuillan
   *
- * This file is part of FFmpeg.
+ * This file is part of Libav.
   *
- * FFmpeg is free software; you can redistribute it and/or
+ * Libav is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
- * FFmpeg is distributed in the hope that it will be useful,
+ * Libav is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
+ * License along with Libav; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
@@ -43,15 +43,16 @@
  #include <string.h>
  #include <math.h>
  
+#include "libavutil/audioconvert.h"
  #include "avcodec.h"
-#include "get_bits.h"
+#include "dsputil.h"
  #include "libavutil/common.h"
-#include "celp_math.h"
  #include "celp_filters.h"
  #include "acelp_filters.h"
  #include "acelp_vectors.h"
  #include "acelp_pitch_delay.h"
  #include "lsp.h"
+#include "amr.h"
  
  #include "amrnbdata.h"
  
@@ -82,7 +83,7 @@
  /** Maximum sharpening factor
   *
   * The specification says 0.8, which should be 13107, but the reference C code
- * uses 13017 instead. (Amusingly the same applies to SHARP_MAX in g729dec.c.)
+ * uses 13017 instead. (Amusingly the same applies to SHARP_MAX in bitexact G.729.)
   */
  #define SHARP_MAX 0.79449462890625
  
@@ -94,6 +95,7 @@
  #define AMR_AGC_ALPHA      0.9
  
  typedef struct AMRContext {
+    AVFrame                         avframe; ///< AVFrame for decoded samples
      AMRNBFrame                        frame; ///< decoded AMR parameters (lsf coefficients, codebook indexes, etc)
      uint8_t             bad_frame_indicator; ///< bad frame ? 1 : 0
      enum Mode                cur_frame_mode;
@@ -153,7 +155,15 @@ static av_cold int amrnb_decode_init(AVCodecContext *avctx)
      AMRContext *p = avctx->priv_data;
      int i;
  
-    avctx->sample_fmt = SAMPLE_FMT_FLT;
+    if (avctx->channels > 1) {
+        av_log_missing_feature(avctx, "multi-channel AMR", 0);
+        return AVERROR_PATCHWELCOME;
+    }
+
+    avctx->channels       = 1;
+    avctx->channel_layout = AV_CH_LAYOUT_MONO;
+    avctx->sample_rate    = 8000;
+    avctx->sample_fmt     = AV_SAMPLE_FMT_FLT;
  
      // p->excitation always points to the same position in p->excitation_buf
      p->excitation = &p->excitation_buf[PITCH_DELAY_MAX + LP_FILTER_ORDER + 1];
@@ -166,6 +176,9 @@ static av_cold int amrnb_decode_init(AVCodecContext *avctx)
      for (i = 0; i < 4; i++)
          p->prediction_error[i] = MIN_ENERGY;
  
+    avcodec_get_frame_defaults(&p->avframe);
+    avctx->coded_frame = &p->avframe;
+
      return 0;
  }
  
@@ -184,41 +197,25 @@ static av_cold int amrnb_decode_init(AVCodecContext *avctx)
  static enum Mode unpack_bitstream(AMRContext *p, const uint8_t *buf,
                                    int buf_size)
  {
-    GetBitContext gb;
      enum Mode mode;
  
-    init_get_bits(&gb, buf, buf_size * 8);
-
      // Decode the first octet.
-    skip_bits(&gb, 1);                        // padding bit
-    mode = get_bits(&gb, 4);                  // frame type
-    p->bad_frame_indicator = !get_bits1(&gb); // quality bit
-    skip_bits(&gb, 2);                        // two padding bits
-
-    if (mode < MODE_DTX) {
-        uint16_t *data = (uint16_t *)&p->frame;
-        const uint8_t *order = amr_unpacking_bitmaps_per_mode[mode];
-        int field_size;
-
-        memset(&p->frame, 0, sizeof(AMRNBFrame));
-        buf++;
-        while ((field_size = *order++)) {
-            int field = 0;
-            int field_offset = *order++;
-            while (field_size--) {
-               int bit = *order++;
-               field <<= 1;
-               field |= buf[bit >> 3] >> (bit & 7) & 1;
-            }
-            data[field_offset] = field;
-        }
+    mode = buf[0] >> 3 & 0x0F;                      // frame type
+    p->bad_frame_indicator = (buf[0] & 0x4) != 0x4; // quality bit
+
+    if (mode >= N_MODES || buf_size < frame_sizes_nb[mode] + 1) {
+        return NO_DATA;
      }
  
+    if (mode < MODE_DTX)
+        ff_amr_bit_reorder((uint16_t *) &p->frame, sizeof(AMRNBFrame), buf + 1,
+                           amr_unpacking_bitmaps_per_mode[mode]);
+
      return mode;
  }
  
  
-/// @defgroup amr_lpc_decoding AMR pitch LPC coefficient decoding functions
+/// @name AMR pitch LPC coefficient decoding functions
  /// @{
  
  /**
@@ -269,7 +266,7 @@ static void lsf2lsp_for_mode12k2(AMRContext *p, double lsp[LP_FILTER_ORDER],
      }
  
      if (update)
-        memcpy(p->prev_lsf_r, lsf_r, LP_FILTER_ORDER * sizeof(float));
+        memcpy(p->prev_lsf_r, lsf_r, LP_FILTER_ORDER * sizeof(*lsf_r));
  
      for (i = 0; i < LP_FILTER_ORDER; i++)
          lsf_q[i] = lsf_r[i] * (LSF_R_FAC / 8000.0) + lsf_no_r[i] * (1.0 / 8000.0);
@@ -355,7 +352,7 @@ static void lsf2lsp_3(AMRContext *p)
  /// @}
  
  
-/// @defgroup amr_pitch_vector_decoding AMR pitch vector decoding functions
+/// @name AMR pitch vector decoding functions
  /// @{
  
  /**
@@ -417,7 +414,7 @@ static void decode_pitch_vector(AMRContext *p,
  /// @}
  
  
-/// @defgroup amr_algebraic_code_book AMR algebraic code book (fixed) vector decoding functions
+/// @name AMR algebraic code book (fixed) vector decoding functions
  /// @{
  
  /**
@@ -561,7 +558,7 @@ static void pitch_sharpening(AMRContext *p, int subframe, enum Mode mode,
  /// @}
  
  
-/// @defgroup amr_gain_decoding AMR gain decoding functions
+/// @name AMR gain decoding functions
  /// @{
  
  /**
@@ -647,7 +644,7 @@ static void decode_gains(AMRContext *p, const AMRNBSubframe *amr_subframe,
  /// @}
  
  
-/// @defgroup amr_pre_processing AMR pre-processing functions
+/// @name AMR preprocessing functions
  /// @{
  
  /**
@@ -663,7 +660,7 @@ static void decode_gains(AMRContext *p, const AMRNBSubframe *amr_subframe,
  static void apply_ir_filter(float *out, const AMRFixed *in,
                              const float *filter)
  {
-    float filter1[AMR_SUBFRAME_SIZE],     //!< filters at pitch lag*1 and *2
+    float filter1[AMR_SUBFRAME_SIZE],     ///< filters at pitch lag*1 and *2
            filter2[AMR_SUBFRAME_SIZE];
      int   lag = in->pitch_lag;
      float fac = in->pitch_fac;
@@ -765,7 +762,7 @@ static const float *anti_sparseness(AMRContext *p, AMRFixed *fixed_sparse,
  /// @}
  
  
-/// @defgroup amr_synthesis AMR synthesis functions
+/// @name AMR synthesis functions
  /// @{
  
  /**
@@ -796,8 +793,8 @@ static int synthesis(AMRContext *p, float *lpc,
  
      // emphasize pitch vector contribution
      if (p->pitch_gain[4] > 0.5 && !overflow) {
-        float energy = ff_dot_productf(excitation, excitation,
-                                       AMR_SUBFRAME_SIZE);
+        float energy = ff_scalarproduct_float_c(excitation, excitation,
+                                                AMR_SUBFRAME_SIZE);
          float pitch_factor =
              p->pitch_gain[4] *
              (p->cur_frame_mode == MODE_12k2 ?
@@ -826,7 +823,7 @@ static int synthesis(AMRContext *p, float *lpc,
  /// @}
  
  
-/// @defgroup amr_update AMR update functions
+/// @name AMR update functions
  /// @{
  
  /**
@@ -851,7 +848,7 @@ static void update_state(AMRContext *p)
  /// @}
  
  
-/// @defgroup amr_postproc AMR Post processing functions
+/// @name AMR Postprocessing functions
  /// @{
  
  /**
@@ -873,8 +870,8 @@ static float tilt_factor(float *lpc_n, float *lpc_d)
      ff_celp_lp_synthesis_filterf(hf, lpc_d, hf, AMR_TILT_RESPONSE,
                                   LP_FILTER_ORDER);
  
-    rh0 = ff_dot_productf(hf, hf,     AMR_TILT_RESPONSE);
-    rh1 = ff_dot_productf(hf, hf + 1, AMR_TILT_RESPONSE - 1);
+    rh0 = ff_scalarproduct_float_c(hf, hf,     AMR_TILT_RESPONSE);
+    rh1 = ff_scalarproduct_float_c(hf, hf + 1, AMR_TILT_RESPONSE - 1);
  
      // The spec only specifies this check for 12.2 and 10.2 kbit/s
      // modes. But in the ref source the tilt is always non-negative.
@@ -894,8 +891,8 @@ static void postfilter(AMRContext *p, float *lpc, float *buf_out)
      int i;
      float *samples          = p->samples_in + LP_FILTER_ORDER; // Start of input
  
-    float speech_gain       = ff_dot_productf(samples, samples,
-                                              AMR_SUBFRAME_SIZE);
+    float speech_gain       = ff_scalarproduct_float_c(samples, samples,
+                                                       AMR_SUBFRAME_SIZE);
  
      float pole_out[AMR_SUBFRAME_SIZE + LP_FILTER_ORDER];  // Output of pole filter
      const float *gamma_n, *gamma_d;                       // Formant filter factor table
@@ -933,25 +930,37 @@ static void postfilter(AMRContext *p, float *lpc, float *buf_out)
  
  /// @}
  
-static int amrnb_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
-                              AVPacket *avpkt)
+static int amrnb_decode_frame(AVCodecContext *avctx, void *data,
+                              int *got_frame_ptr, AVPacket *avpkt)
  {
  
      AMRContext *p = avctx->priv_data;        // pointer to private data
      const uint8_t *buf = avpkt->data;
      int buf_size       = avpkt->size;
-    float *buf_out = data;                   // pointer to the output data buffer
-    int i, subframe;
+    float *buf_out;                          // pointer to the output data buffer
+    int i, subframe, ret;
      float fixed_gain_factor;
      AMRFixed fixed_sparse = {0};             // fixed vector up to anti-sparseness processing
      float spare_vector[AMR_SUBFRAME_SIZE];   // extra stack space to hold result from anti-sparseness processing
      float synth_fixed_gain;                  // the fixed gain that synthesis should use
      const float *synth_fixed_vector;         // pointer to the fixed vector that synthesis should use
  
+    /* get output buffer */
+    p->avframe.nb_samples = AMR_BLOCK_SIZE;
+    if ((ret = avctx->get_buffer(avctx, &p->avframe)) < 0) {
+        av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
+        return ret;
+    }
+    buf_out = (float *)p->avframe.data[0];
+
      p->cur_frame_mode = unpack_bitstream(p, buf, buf_size);
+    if (p->cur_frame_mode == NO_DATA) {
+        av_log(avctx, AV_LOG_ERROR, "Corrupt bitstream\n");
+        return AVERROR_INVALIDDATA;
+    }
      if (p->cur_frame_mode == MODE_DTX) {
          av_log_missing_feature(avctx, "dtx mode", 1);
-        return -1;
+        return AVERROR_PATCHWELCOME;
      }
  
      if (p->cur_frame_mode == MODE_12k2) {
@@ -979,13 +988,19 @@ static int amrnb_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
  
          pitch_sharpening(p, subframe, p->cur_frame_mode, &fixed_sparse);
  
+        if (fixed_sparse.pitch_lag == 0) {
+            av_log(avctx, AV_LOG_ERROR, "The file is corrupted, pitch_lag = 0 is not allowed\n");
+            return AVERROR_INVALIDDATA;
+        }
          ff_set_fixed_vector(p->fixed_vector, &fixed_sparse, 1.0,
                              AMR_SUBFRAME_SIZE);
  
          p->fixed_gain[4] =
              ff_amr_set_fixed_gain(fixed_gain_factor,
-                       ff_dot_productf(p->fixed_vector, p->fixed_vector,
-                                       AMR_SUBFRAME_SIZE)/AMR_SUBFRAME_SIZE,
+                                  ff_scalarproduct_float_c(p->fixed_vector,
+                                                           p->fixed_vector,
+                                                           AMR_SUBFRAME_SIZE) /
+                                  AMR_SUBFRAME_SIZE,
                         p->prediction_error,
                         energy_mean[p->cur_frame_mode], energy_pred_fac);
  
@@ -1042,21 +1057,23 @@ static int amrnb_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
      ff_weighted_vector_sumf(p->lsf_avg, p->lsf_avg, p->lsf_q[3],
                              0.84, 0.16, LP_FILTER_ORDER);
  
-    /* report how many samples we got */
-    *data_size = AMR_BLOCK_SIZE * sizeof(float);
+    *got_frame_ptr   = 1;
+    *(AVFrame *)data = p->avframe;
  
      /* return the amount of bytes consumed if everything was OK */
      return frame_sizes_nb[p->cur_frame_mode] + 1; // +7 for rounding and +8 for TOC
  }
  
  
-AVCodec amrnb_decoder = {
+AVCodec ff_amrnb_decoder = {
      .name           = "amrnb",
      .type           = AVMEDIA_TYPE_AUDIO,
-    .id             = CODEC_ID_AMR_NB,
+    .id             = AV_CODEC_ID_AMR_NB,
      .priv_data_size = sizeof(AMRContext),
      .init           = amrnb_decode_init,
      .decode         = amrnb_decode_frame,
-    .long_name      = NULL_IF_CONFIG_SMALL("Adaptive Multi-Rate NarrowBand"),
-    .sample_fmts    = (enum SampleFormat[]){SAMPLE_FMT_FLT,SAMPLE_FMT_NONE},
+    .capabilities   = CODEC_CAP_DR1,
+    .long_name      = NULL_IF_CONFIG_SMALL("AMR-NB (Adaptive Multi-Rate NarrowBand)"),
+    .sample_fmts    = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_FLT,
+                                                     AV_SAMPLE_FMT_NONE },
  };