x86: rename dsputil.asm to idctdsp.asm

[ffmpeg] / libavcodec / dsputil.h
diff --git a/libavcodec/dsputil.h b/libavcodec/dsputil.h

index b271dccf823c99b4a07c42cb7f0d480a9bcee6a1..0871dbe62d5d56765cabaae865536104292dfea9 100644 (file)
--- a/libavcodec/dsputil.h
+++ b/libavcodec/dsputil.h
@@ -3,20 +3,20 @@
   * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
   * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
   *
- * This file is part of Libav.
+ * This file is part of FFmpeg.
   *
- * Libav is free software; you can redistribute it and/or
+ * FFmpeg is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
- * Libav is distributed in the hope that it will be useful,
+ * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
- * License along with Libav; if not, write to the Free Software
+ * License along with FFmpeg; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
@@ -34,6 +34,20 @@
  
  extern uint32_t ff_square_tab[512];
  
+
+/* minimum alignment rules ;)
+ * If you notice errors in the alignment annotations, need more alignment for
+ * some ASM code on some CPU, or need to use a function with less aligned data,
+ * then send a mail to the ffmpeg-devel mailing list, ...
+ *
+ * !warning These alignments might not match reality (an attribute((align))
+ * may be missing somewhere).
+ * I (Michael) did not check them; these are just the alignments which I think
+ * could be reached easily ...
+ *
+ * !future video codecs might need functions with less strict alignment
+ */
+
  struct MpegEncContext;
  /* Motion estimation:
   * h is limited to { width / 2, width, 2 * width },
@@ -44,22 +58,6 @@ typedef int (*me_cmp_func)(struct MpegEncContext *c,
                             uint8_t *blk1 /* align width (8 or 16) */,
                             uint8_t *blk2 /* align 1 */, int line_size, int h);
  
-/**
- * Scantable.
- */
-typedef struct ScanTable {
-    const uint8_t *scantable;
-    uint8_t permutated[64];
-    uint8_t raster_end[64];
-} ScanTable;
-
-void ff_init_scantable(uint8_t *permutation, ScanTable *st,
-                       const uint8_t *src_scantable);
-void ff_init_scantable_permutation(uint8_t *idct_permutation,
-                                   int idct_permutation_type);
-int ff_init_scantable_permutation_x86(uint8_t *idct_permutation,
-                                      int idct_permutation_type);
-
  /**
   * DSPContext.
   */
@@ -72,15 +70,6 @@ typedef struct DSPContext {
                          const uint8_t *s1 /* align 8 */,
                          const uint8_t *s2 /* align 8 */,
                          int stride);
-    void (*put_pixels_clamped)(const int16_t *block /* align 16 */,
-                               uint8_t *pixels /* align 8 */,
-                               int line_size);
-    void (*put_signed_pixels_clamped)(const int16_t *block /* align 16 */,
-                                      uint8_t *pixels /* align 8 */,
-                                      int line_size);
-    void (*add_pixels_clamped)(const int16_t *block /* align 16 */,
-                               uint8_t *pixels /* align 8 */,
-                               int line_size);
      int (*sum_abs_dctelem)(int16_t *block /* align 16 */);
  
      int (*pix_sum)(uint8_t *pix, int line_size);
@@ -96,6 +85,8 @@ typedef struct DSPContext {
      me_cmp_func vsad[6];
      me_cmp_func vsse[6];
      me_cmp_func nsse[6];
+    me_cmp_func w53[6];
+    me_cmp_func w97[6];
      me_cmp_func dct_max[6];
      me_cmp_func dct264_sad[6];
  
@@ -112,47 +103,6 @@ typedef struct DSPContext {
      void (*fdct)(int16_t *block /* align 16 */);
      void (*fdct248)(int16_t *block /* align 16 */);
  
-    /* IDCT really */
-    void (*idct)(int16_t *block /* align 16 */);
-
-    /**
-     * block -> idct -> clip to unsigned 8 bit -> dest.
-     * (-1392, 0, 0, ...) -> idct -> (-174, -174, ...) -> put -> (0, 0, ...)
-     * @param line_size size in bytes of a horizontal line of dest
-     */
-    void (*idct_put)(uint8_t *dest /* align 8 */,
-                     int line_size, int16_t *block /* align 16 */);
-
-    /**
-     * block -> idct -> add dest -> clip to unsigned 8 bit -> dest.
-     * @param line_size size in bytes of a horizontal line of dest
-     */
-    void (*idct_add)(uint8_t *dest /* align 8 */,
-                     int line_size, int16_t *block /* align 16 */);
-
-    /**
-     * IDCT input permutation.
-     * Several optimized IDCTs need a permutated input (relative to the
-     * normal order of the reference IDCT).
-     * This permutation must be performed before the idct_put/add.
-     * Note, normally this can be merged with the zigzag/alternate scan<br>
-     * An example to avoid confusion:
-     * - (->decode coeffs -> zigzag reorder -> dequant -> reference IDCT -> ...)
-     * - (x -> reference DCT -> reference IDCT -> x)
-     * - (x -> reference DCT -> simple_mmx_perm = idct_permutation
-     *    -> simple_idct_mmx -> x)
-     * - (-> decode coeffs -> zigzag reorder -> simple_mmx_perm -> dequant
-     *    -> simple_idct_mmx -> ...)
-     */
-    uint8_t idct_permutation[64];
-    int idct_permutation_type;
-#define FF_NO_IDCT_PERM 1
-#define FF_LIBMPEG2_IDCT_PERM 2
-#define FF_SIMPLE_IDCT_PERM 3
-#define FF_TRANSPOSE_IDCT_PERM 4
-#define FF_PARTTRANS_IDCT_PERM 5
-#define FF_SSE2_IDCT_PERM 6
-
      int (*try_8x8basis)(int16_t rem[64], int16_t weight[64],
                          int16_t basis[64], int scale);
      void (*add_8x8basis)(int16_t rem[64], int16_t basis[64], int scale);
@@ -171,9 +121,14 @@ typedef struct DSPContext {
  
  void ff_dsputil_static_init(void);
  void ff_dsputil_init(DSPContext *p, AVCodecContext *avctx);
+void avpriv_dsputil_init(DSPContext* p, AVCodecContext *avctx);
+attribute_deprecated void dsputil_init(DSPContext* c, AVCodecContext *avctx);
+
+int ff_check_alignment(void);
  
  void ff_set_cmp(DSPContext *c, me_cmp_func *cmp, int type);
  
+void ff_dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx);
  void ff_dsputil_init_arm(DSPContext *c, AVCodecContext *avctx,
                           unsigned high_bit_depth);
  void ff_dsputil_init_ppc(DSPContext *c, AVCodecContext *avctx,
@@ -181,4 +136,6 @@ void ff_dsputil_init_ppc(DSPContext *c, AVCodecContext *avctx,
  void ff_dsputil_init_x86(DSPContext *c, AVCodecContext *avctx,
                           unsigned high_bit_depth);
  
+void ff_dsputil_init_dwt(DSPContext *c);
+
  #endif /* AVCODEC_DSPUTIL_H */