Use reget_buffer instead of get_buffer. Fixes issue1367.

[ffmpeg] / libavcodec / dsputil.h
diff --git a/libavcodec/dsputil.h b/libavcodec/dsputil.h

index 2a0542038301d7ef2ac1e303bf6a191270060665..db19e3f07681445bb4d598181aff8d0a964f44f8 100644 (file)
--- a/libavcodec/dsputil.h
+++ b/libavcodec/dsputil.h
@@ -319,6 +319,7 @@ typedef struct DSPContext {
      h264_chroma_mc_func avg_h264_chroma_pixels_tab[3];
      /* This is really one func used in VC-1 decoding */
      h264_chroma_mc_func put_no_rnd_vc1_chroma_pixels_tab[3];
+    h264_chroma_mc_func avg_no_rnd_vc1_chroma_pixels_tab[3];
  
      qpel_mc_func put_h264_qpel_pixels_tab[4][16];
      qpel_mc_func avg_h264_qpel_pixels_tab[4][16];
@@ -395,6 +396,7 @@ typedef struct DSPContext {
      void (*vector_fmul_window)(float *dst, const float *src0, const float *src1, const float *win, float add_bias, int len);
      /* assume len is a multiple of 8, and arrays are 16-byte aligned */
      void (*int32_to_float_fmul_scalar)(float *dst, const int *src, float mul, int len);
+    void (*vector_clipf)(float *dst /* align 16 */, const float *src /* align 16 */, float min, float max, int len /* align 16 */);
  
      /* C version: convert floats from the range [384.0,386.0] to ints in [-32768,32767]
       * simd versions: convert floats from [-32768.0,32767.0] without rescaling and arrays are 16byte aligned */
@@ -474,13 +476,29 @@ typedef struct DSPContext {
  
      void (*shrink[4])(uint8_t *dst, int dst_wrap, const uint8_t *src, int src_wrap, int width, int height);
  
+    /* mlp/truehd functions */
+    void (*mlp_filter_channel)(int32_t *state, const int32_t *coeff,
+                               int firorder, int iirorder,
+                               unsigned int filter_shift, int32_t mask, int blocksize,
+                               int32_t *sample_buffer);
+
      /* vc1 functions */
      void (*vc1_inv_trans_8x8)(DCTELEM *b);
      void (*vc1_inv_trans_8x4)(uint8_t *dest, int line_size, DCTELEM *block);
      void (*vc1_inv_trans_4x8)(uint8_t *dest, int line_size, DCTELEM *block);
      void (*vc1_inv_trans_4x4)(uint8_t *dest, int line_size, DCTELEM *block);
+    void (*vc1_inv_trans_8x8_dc)(uint8_t *dest, int line_size, DCTELEM *block);
+    void (*vc1_inv_trans_8x4_dc)(uint8_t *dest, int line_size, DCTELEM *block);
+    void (*vc1_inv_trans_4x8_dc)(uint8_t *dest, int line_size, DCTELEM *block);
+    void (*vc1_inv_trans_4x4_dc)(uint8_t *dest, int line_size, DCTELEM *block);
      void (*vc1_v_overlap)(uint8_t* src, int stride);
      void (*vc1_h_overlap)(uint8_t* src, int stride);
+    void (*vc1_v_loop_filter4)(uint8_t *src, int stride, int pq);
+    void (*vc1_h_loop_filter4)(uint8_t *src, int stride, int pq);
+    void (*vc1_v_loop_filter8)(uint8_t *src, int stride, int pq);
+    void (*vc1_h_loop_filter8)(uint8_t *src, int stride, int pq);
+    void (*vc1_v_loop_filter16)(uint8_t *src, int stride, int pq);
+    void (*vc1_h_loop_filter16)(uint8_t *src, int stride, int pq);
      /* put 8x8 block with bicubic interpolation and quarterpel precision
       * last argument is actually round value instead of height
       */
@@ -580,6 +598,7 @@ static inline int get_penalty_factor(int lambda, int lambda2, int type){
  /* should be defined by architectures supporting
     one or more MultiMedia extension */
  int mm_support(void);
+extern int mm_flags;
  
  void dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx);
  void dsputil_init_arm(DSPContext* c, AVCodecContext *avctx);
@@ -592,17 +611,12 @@ void dsputil_init_sh4(DSPContext* c, AVCodecContext *avctx);
  void dsputil_init_vis(DSPContext* c, AVCodecContext *avctx);
  
  #define DECLARE_ALIGNED_16(t, v) DECLARE_ALIGNED(16, t, v)
+#define DECLARE_ALIGNED_8(t, v)  DECLARE_ALIGNED(8, t, v)
  
  #if HAVE_MMX
  
  #undef emms_c
  
-extern int mm_flags;
-
-void add_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);
-void put_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);
-void put_signed_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);
-
  static inline void emms(void)
  {
      __asm__ volatile ("emms;":::"memory");
@@ -615,27 +629,18 @@ static inline void emms(void)
          emms();\
  }
  
-void dsputil_init_pix_mmx(DSPContext* c, AVCodecContext *avctx);
-
  #elif ARCH_ARM
  
-extern int mm_flags;
-
  #if HAVE_NEON
-#   define DECLARE_ALIGNED_8(t, v) DECLARE_ALIGNED(16, t, v)
  #   define STRIDE_ALIGN 16
  #endif
  
  #elif ARCH_PPC
  
-extern int mm_flags;
-
-#define DECLARE_ALIGNED_8(t, v) DECLARE_ALIGNED(16, t, v)
  #define STRIDE_ALIGN 16
  
  #elif HAVE_MMI
  
-#define DECLARE_ALIGNED_8(t, v) DECLARE_ALIGNED(16, t, v)
  #define STRIDE_ALIGN 16
  
  #else
@@ -645,10 +650,6 @@ extern int mm_flags;
  
  #endif
  
-#ifndef DECLARE_ALIGNED_8
-#   define DECLARE_ALIGNED_8(t, v) DECLARE_ALIGNED(8, t, v)
-#endif
-
  #ifndef STRIDE_ALIGN
  #   define STRIDE_ALIGN 8
  #endif
@@ -683,7 +684,7 @@ typedef struct FFTContext {
      void (*imdct_half)(struct MDCTContext *s, FFTSample *output, const FFTSample *input);
  } FFTContext;
  
-extern FFTSample* ff_cos_tabs[13];
+extern FFTSample* const ff_cos_tabs[13];
  
  /**
   * Sets up a complex FFT.
@@ -693,11 +694,13 @@ extern FFTSample* ff_cos_tabs[13];
  int ff_fft_init(FFTContext *s, int nbits, int inverse);
  void ff_fft_permute_c(FFTContext *s, FFTComplex *z);
  void ff_fft_permute_sse(FFTContext *s, FFTComplex *z);
+void ff_fft_permute_neon(FFTContext *s, FFTComplex *z);
  void ff_fft_calc_c(FFTContext *s, FFTComplex *z);
  void ff_fft_calc_sse(FFTContext *s, FFTComplex *z);
  void ff_fft_calc_3dn(FFTContext *s, FFTComplex *z);
  void ff_fft_calc_3dn2(FFTContext *s, FFTComplex *z);
  void ff_fft_calc_altivec(FFTContext *s, FFTComplex *z);
+void ff_fft_calc_neon(FFTContext *s, FFTComplex *z);
  
  /**
   * Do the permutation needed BEFORE calling ff_fft_calc().
@@ -756,9 +759,9 @@ extern float ff_sine_512 [ 512];
  extern float ff_sine_1024[1024];
  extern float ff_sine_2048[2048];
  extern float ff_sine_4096[4096];
-extern float *ff_sine_windows[6];
+extern float * const ff_sine_windows[6];
  
-int ff_mdct_init(MDCTContext *s, int nbits, int inverse);
+int ff_mdct_init(MDCTContext *s, int nbits, int inverse, double scale);
  void ff_imdct_calc_c(MDCTContext *s, FFTSample *output, const FFTSample *input);
  void ff_imdct_half_c(MDCTContext *s, FFTSample *output, const FFTSample *input);
  void ff_imdct_calc_3dn(MDCTContext *s, FFTSample *output, const FFTSample *input);
@@ -767,6 +770,8 @@ void ff_imdct_calc_3dn2(MDCTContext *s, FFTSample *output, const FFTSample *inpu
  void ff_imdct_half_3dn2(MDCTContext *s, FFTSample *output, const FFTSample *input);
  void ff_imdct_calc_sse(MDCTContext *s, FFTSample *output, const FFTSample *input);
  void ff_imdct_half_sse(MDCTContext *s, FFTSample *output, const FFTSample *input);
+void ff_imdct_calc_neon(MDCTContext *s, FFTSample *output, const FFTSample *input);
+void ff_imdct_half_neon(MDCTContext *s, FFTSample *output, const FFTSample *input);
  void ff_mdct_calc(MDCTContext *s, FFTSample *out, const FFTSample *input);
  void ff_mdct_end(MDCTContext *s);