git.sesse.net Git - ffmpeg/blob - libswscale/swscale_internal.h

   1 /*
   2  * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
   3  *
   4  * This file is part of FFmpeg.
   5  *
   6  * FFmpeg is free software; you can redistribute it and/or
   7  * modify it under the terms of the GNU Lesser General Public
   8  * License as published by the Free Software Foundation; either
   9  * version 2.1 of the License, or (at your option) any later version.
  10  *
  11  * FFmpeg is distributed in the hope that it will be useful,
  12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14  * Lesser General Public License for more details.
  15  *
  16  * You should have received a copy of the GNU Lesser General Public
  17  * License along with FFmpeg; if not, write to the Free Software
  18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19  */
  20
  21 #ifndef SWSCALE_SWSCALE_INTERNAL_H
  22 #define SWSCALE_SWSCALE_INTERNAL_H
  23
  24 #include "config.h"
  25
  26 #if HAVE_ALTIVEC_H
  27 #include <altivec.h>
  28 #endif
  29
  30 #include "libavutil/avutil.h"
  31
  32 #define STR(s)         AV_TOSTRING(s) //AV_STRINGIFY is too long
  33
  34 #define MAX_FILTER_SIZE 256
  35
  36 #if ARCH_X86
  37 #define VOFW 5120
  38 #else
  39 #define VOFW 2048 // faster on PPC and not tested on others
  40 #endif
  41
  42 #define VOF  (VOFW*2)
  43
  44 #if HAVE_BIGENDIAN
  45 #define ALT32_CORR (-1)
  46 #else
  47 #define ALT32_CORR   1
  48 #endif
  49
  50 #if ARCH_X86_64
  51 #   define APCK_PTR2 8
  52 #   define APCK_COEF 16
  53 #   define APCK_SIZE 24
  54 #else
  55 #   define APCK_PTR2 4
  56 #   define APCK_COEF 8
  57 #   define APCK_SIZE 16
  58 #endif
  59
  60 struct SwsContext;
  61
  62 typedef int (*SwsFunc)(struct SwsContext *context, const uint8_t* src[],
  63                        int srcStride[], int srcSliceY, int srcSliceH,
  64                        uint8_t* dst[], int dstStride[]);
  65
  66 /* This struct should be aligned on at least a 32-byte boundary. */
  67 typedef struct SwsContext {
  68     /**
  69      * info on struct for av_log
  70      */
  71     const AVClass *av_class;
  72
  73     /**
  74      * Note that src, dst, srcStride, dstStride will be copied in the
  75      * sws_scale() wrapper so they can be freely modified here.
  76      */
  77     SwsFunc swScale;
  78     int srcW, srcH, dstH;
  79     int chrSrcW, chrSrcH, chrDstW, chrDstH;
  80     int lumXInc, chrXInc;
  81     int lumYInc, chrYInc;
  82     enum PixelFormat dstFormat, srcFormat;  ///< format 4:2:0 type is always YV12
  83     int chrSrcHSubSample, chrSrcVSubSample;
  84     int chrDstHSubSample, chrDstVSubSample;
  85     int vChrDrop;
  86     int sliceDir;
  87     double param[2];
  88
  89     uint32_t pal_yuv[256];
  90     uint32_t pal_rgb[256];
  91
  92     int16_t **lumPixBuf;
  93     int16_t **chrPixBuf;
  94     int16_t **alpPixBuf;
  95     int16_t *hLumFilter;
  96     int16_t *hLumFilterPos;
  97     int16_t *hChrFilter;
  98     int16_t *hChrFilterPos;
  99     int16_t *vLumFilter;
 100     int16_t *vLumFilterPos;
 101     int16_t *vChrFilter;
 102     int16_t *vChrFilterPos;
 103
 104     uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful
 105
 106     int hLumFilterSize;
 107     int hChrFilterSize;
 108     int vLumFilterSize;
 109     int vChrFilterSize;
 110     int vLumBufSize;
 111     int vChrBufSize;
 112
 113     int lumMmx2FilterCodeSize;
 114     int chrMmx2FilterCodeSize;
 115     uint8_t *lumMmx2FilterCode;
 116     uint8_t *chrMmx2FilterCode;
 117
 118     int canMMX2BeUsed;
 119
 120     int lastInLumBuf;
 121     int lastInChrBuf;
 122     int lumBufIndex;
 123     int chrBufIndex;
 124     int dstY;
 125     int flags;
 126     void * yuvTable;            // pointer to the yuv->rgb table start so it can be freed()
 127     uint8_t * table_rV[256];
 128     uint8_t * table_gU[256];
 129     int    table_gV[256];
 130     uint8_t * table_bU[256];
 131
 132     //Colorspace stuff
 133     int contrast, brightness, saturation;    // for sws_getColorspaceDetails
 134     int srcColorspaceTable[4];
 135     int dstColorspaceTable[4];
 136     int srcRange, dstRange;
 137     int yuv2rgb_y_offset;
 138     int yuv2rgb_y_coeff;
 139     int yuv2rgb_v2r_coeff;
 140     int yuv2rgb_v2g_coeff;
 141     int yuv2rgb_u2g_coeff;
 142     int yuv2rgb_u2b_coeff;
 143
 144 #define RED_DITHER            "0*8"
 145 #define GREEN_DITHER          "1*8"
 146 #define BLUE_DITHER           "2*8"
 147 #define Y_COEFF               "3*8"
 148 #define VR_COEFF              "4*8"
 149 #define UB_COEFF              "5*8"
 150 #define VG_COEFF              "6*8"
 151 #define UG_COEFF              "7*8"
 152 #define Y_OFFSET              "8*8"
 153 #define U_OFFSET              "9*8"
 154 #define V_OFFSET              "10*8"
 155 #define LUM_MMX_FILTER_OFFSET "11*8"
 156 #define CHR_MMX_FILTER_OFFSET "11*8+4*4*256"
 157 #define DSTW_OFFSET           "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM
 158 #define ESP_OFFSET            "11*8+4*4*256*2+8"
 159 #define VROUNDER_OFFSET       "11*8+4*4*256*2+16"
 160 #define U_TEMP                "11*8+4*4*256*2+24"
 161 #define V_TEMP                "11*8+4*4*256*2+32"
 162 #define Y_TEMP                "11*8+4*4*256*2+40"
 163 #define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48"
 164
 165     DECLARE_ALIGNED(8, uint64_t, redDither);
 166     DECLARE_ALIGNED(8, uint64_t, greenDither);
 167     DECLARE_ALIGNED(8, uint64_t, blueDither);
 168
 169     DECLARE_ALIGNED(8, uint64_t, yCoeff);
 170     DECLARE_ALIGNED(8, uint64_t, vrCoeff);
 171     DECLARE_ALIGNED(8, uint64_t, ubCoeff);
 172     DECLARE_ALIGNED(8, uint64_t, vgCoeff);
 173     DECLARE_ALIGNED(8, uint64_t, ugCoeff);
 174     DECLARE_ALIGNED(8, uint64_t, yOffset);
 175     DECLARE_ALIGNED(8, uint64_t, uOffset);
 176     DECLARE_ALIGNED(8, uint64_t, vOffset);
 177     int32_t  lumMmxFilter[4*MAX_FILTER_SIZE];
 178     int32_t  chrMmxFilter[4*MAX_FILTER_SIZE];
 179     int dstW;
 180     DECLARE_ALIGNED(8, uint64_t, esp);
 181     DECLARE_ALIGNED(8, uint64_t, vRounder);
 182     DECLARE_ALIGNED(8, uint64_t, u_temp);
 183     DECLARE_ALIGNED(8, uint64_t, v_temp);
 184     DECLARE_ALIGNED(8, uint64_t, y_temp);
 185     int32_t  alpMmxFilter[4*MAX_FILTER_SIZE];
 186
 187 #if HAVE_ALTIVEC
 188     vector signed short   CY;
 189     vector signed short   CRV;
 190     vector signed short   CBU;
 191     vector signed short   CGU;
 192     vector signed short   CGV;
 193     vector signed short   OY;
 194     vector unsigned short CSHIFT;
 195     vector signed short   *vYCoeffsBank, *vCCoeffsBank;
 196 #endif
 197
 198 #if ARCH_BFIN
 199     DECLARE_ALIGNED(4, uint32_t, oy);
 200     DECLARE_ALIGNED(4, uint32_t, oc);
 201     DECLARE_ALIGNED(4, uint32_t, zero);
 202     DECLARE_ALIGNED(4, uint32_t, cy);
 203     DECLARE_ALIGNED(4, uint32_t, crv);
 204     DECLARE_ALIGNED(4, uint32_t, rmask);
 205     DECLARE_ALIGNED(4, uint32_t, cbu);
 206     DECLARE_ALIGNED(4, uint32_t, bmask);
 207     DECLARE_ALIGNED(4, uint32_t, cgu);
 208     DECLARE_ALIGNED(4, uint32_t, cgv);
 209     DECLARE_ALIGNED(4, uint32_t, gmask);
 210 #endif
 211
 212 #if HAVE_VIS
 213     DECLARE_ALIGNED(8, uint64_t, sparc_coeffs[10]);
 214 #endif
 215
 216     /* function pointers for swScale() */
 217     void (*yuv2nv12X  )(struct SwsContext *c,
 218                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 219                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 220                         uint8_t *dest, uint8_t *uDest,
 221                         int dstW, int chrDstW, int dstFormat);
 222     void (*yuv2yuv1   )(struct SwsContext *c,
 223                         const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc,
 224                         uint8_t *dest,
 225                         uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
 226                         long dstW, long chrDstW);
 227     void (*yuv2yuvX   )(struct SwsContext *c,
 228                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 229                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 230                         const int16_t **alpSrc,
 231                         uint8_t *dest,
 232                         uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
 233                         long dstW, long chrDstW);
 234     void (*yuv2packed1)(struct SwsContext *c,
 235                         const uint16_t *buf0,
 236                         const uint16_t *uvbuf0, const uint16_t *uvbuf1,
 237                         const uint16_t *abuf0,
 238                         uint8_t *dest,
 239                         int dstW, int uvalpha, int dstFormat, int flags, int y);
 240     void (*yuv2packed2)(struct SwsContext *c,
 241                         const uint16_t *buf0, const uint16_t *buf1,
 242                         const uint16_t *uvbuf0, const uint16_t *uvbuf1,
 243                         const uint16_t *abuf0, const uint16_t *abuf1,
 244                         uint8_t *dest,
 245                         int dstW, int yalpha, int uvalpha, int y);
 246     void (*yuv2packedX)(struct SwsContext *c,
 247                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 248                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 249                         const int16_t **alpSrc, uint8_t *dest,
 250                         long dstW, long dstY);
 251
 252     void (*lumToYV12)(uint8_t *dst, const uint8_t *src,
 253                       long width, uint32_t *pal); ///< Unscaled conversion of luma plane to YV12 for horizontal scaler.
 254     void (*alpToYV12)(uint8_t *dst, const uint8_t *src,
 255                       long width, uint32_t *pal); ///< Unscaled conversion of alpha plane to YV12 for horizontal scaler.
 256     void (*chrToYV12)(uint8_t *dstU, uint8_t *dstV,
 257                       const uint8_t *src1, const uint8_t *src2,
 258                       long width, uint32_t *pal); ///< Unscaled conversion of chroma planes to YV12 for horizontal scaler.
 259     void (*hyscale_fast)(struct SwsContext *c,
 260                          int16_t *dst, long dstWidth,
 261                          const uint8_t *src, int srcW, int xInc);
 262     void (*hcscale_fast)(struct SwsContext *c,
 263                          int16_t *dst, long dstWidth,
 264                          const uint8_t *src1, const uint8_t *src2,
 265                          int srcW, int xInc);
 266
 267     void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW,
 268                    int xInc, const int16_t *filter, const int16_t *filterPos,
 269                    long filterSize);
 270
 271     void (*lumConvertRange)(uint16_t *dst, int width); ///< Color range conversion function for luma plane if needed.
 272     void (*chrConvertRange)(uint16_t *dst, int width); ///< Color range conversion function for chroma planes if needed.
 273
 274     int lumSrcOffset; ///< Offset given to luma src pointers passed to horizontal input functions.
 275     int chrSrcOffset; ///< Offset given to chroma src pointers passed to horizontal input functions.
 276     int alpSrcOffset; ///< Offset given to alpha src pointers passed to horizontal input functions.
 277
 278     int needs_hcscale; ///< Set if there are chroma planes to be converted.
 279
 280 } SwsContext;
 281 //FIXME check init (where 0)
 282
 283 SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c);
 284 int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
 285                              int fullRange, int brightness,
 286                              int contrast, int saturation);
 287
 288 void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4],
 289                                     int brightness, int contrast, int saturation);
 290 SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c);
 291 SwsFunc ff_yuv2rgb_init_vis(SwsContext *c);
 292 SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c);
 293 SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c);
 294 SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c);
 295 void ff_bfin_get_unscaled_swscale(SwsContext *c);
 296 void ff_yuv2packedX_altivec(SwsContext *c,
 297                             const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
 298                             const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
 299                             uint8_t *dest, int dstW, int dstY);
 300
 301 const char *sws_format_name(enum PixelFormat format);
 302
 303 //FIXME replace this with something faster
 304 #define is16BPS(x)      (           \
 305            (x)==PIX_FMT_GRAY16BE    \
 306         || (x)==PIX_FMT_GRAY16LE    \
 307         || (x)==PIX_FMT_RGB48BE     \
 308         || (x)==PIX_FMT_RGB48LE     \
 309         || (x)==PIX_FMT_YUV420P16LE   \
 310         || (x)==PIX_FMT_YUV422P16LE   \
 311         || (x)==PIX_FMT_YUV444P16LE   \
 312         || (x)==PIX_FMT_YUV420P16BE   \
 313         || (x)==PIX_FMT_YUV422P16BE   \
 314         || (x)==PIX_FMT_YUV444P16BE   \
 315     )
 316 #define isBE(x) ((x)&1)
 317 #define isPlanar8YUV(x) (           \
 318            (x)==PIX_FMT_YUV410P     \
 319         || (x)==PIX_FMT_YUV420P     \
 320         || (x)==PIX_FMT_YUVA420P    \
 321         || (x)==PIX_FMT_YUV411P     \
 322         || (x)==PIX_FMT_YUV422P     \
 323         || (x)==PIX_FMT_YUV444P     \
 324         || (x)==PIX_FMT_YUV440P     \
 325         || (x)==PIX_FMT_NV12        \
 326         || (x)==PIX_FMT_NV21        \
 327     )
 328 #define isPlanarYUV(x)  (           \
 329         isPlanar8YUV(x)             \
 330         || (x)==PIX_FMT_YUV420P16LE   \
 331         || (x)==PIX_FMT_YUV422P16LE   \
 332         || (x)==PIX_FMT_YUV444P16LE   \
 333         || (x)==PIX_FMT_YUV420P16BE   \
 334         || (x)==PIX_FMT_YUV422P16BE   \
 335         || (x)==PIX_FMT_YUV444P16BE   \
 336     )
 337 #define isYUV(x)        (           \
 338            (x)==PIX_FMT_UYVY422     \
 339         || (x)==PIX_FMT_YUYV422     \
 340         || isPlanarYUV(x)           \
 341     )
 342 #define isGray(x)       (           \
 343            (x)==PIX_FMT_GRAY8       \
 344         || (x)==PIX_FMT_GRAY16BE    \
 345         || (x)==PIX_FMT_GRAY16LE    \
 346     )
 347 #define isGray16(x)     (           \
 348            (x)==PIX_FMT_GRAY16BE    \
 349         || (x)==PIX_FMT_GRAY16LE    \
 350     )
 351 #define isRGB(x)        (           \
 352            (x)==PIX_FMT_RGB48BE     \
 353         || (x)==PIX_FMT_RGB48LE     \
 354         || (x)==PIX_FMT_RGB32       \
 355         || (x)==PIX_FMT_RGB32_1     \
 356         || (x)==PIX_FMT_RGB24       \
 357         || (x)==PIX_FMT_RGB565      \
 358         || (x)==PIX_FMT_RGB555      \
 359         || (x)==PIX_FMT_RGB8        \
 360         || (x)==PIX_FMT_RGB4        \
 361         || (x)==PIX_FMT_RGB4_BYTE   \
 362         || (x)==PIX_FMT_MONOBLACK   \
 363         || (x)==PIX_FMT_MONOWHITE   \
 364     )
 365 #define isBGR(x)        (           \
 366            (x)==PIX_FMT_BGR32       \
 367         || (x)==PIX_FMT_BGR32_1     \
 368         || (x)==PIX_FMT_BGR24       \
 369         || (x)==PIX_FMT_BGR565      \
 370         || (x)==PIX_FMT_BGR555      \
 371         || (x)==PIX_FMT_BGR8        \
 372         || (x)==PIX_FMT_BGR4        \
 373         || (x)==PIX_FMT_BGR4_BYTE   \
 374         || (x)==PIX_FMT_MONOBLACK   \
 375         || (x)==PIX_FMT_MONOWHITE   \
 376     )
 377 #define isALPHA(x)      (           \
 378            (x)==PIX_FMT_BGR32       \
 379         || (x)==PIX_FMT_BGR32_1     \
 380         || (x)==PIX_FMT_RGB32       \
 381         || (x)==PIX_FMT_RGB32_1     \
 382         || (x)==PIX_FMT_YUVA420P    \
 383     )
 384
 385 static inline int fmt_depth(int fmt)
 386 {
 387     switch(fmt) {
 388     case PIX_FMT_RGB48BE:
 389     case PIX_FMT_RGB48LE:
 390         return 48;
 391     case PIX_FMT_BGRA:
 392     case PIX_FMT_ABGR:
 393     case PIX_FMT_RGBA:
 394     case PIX_FMT_ARGB:
 395         return 32;
 396     case PIX_FMT_BGR24:
 397     case PIX_FMT_RGB24:
 398         return 24;
 399     case PIX_FMT_BGR565:
 400     case PIX_FMT_RGB565:
 401     case PIX_FMT_GRAY16BE:
 402     case PIX_FMT_GRAY16LE:
 403         return 16;
 404     case PIX_FMT_BGR555:
 405     case PIX_FMT_RGB555:
 406         return 15;
 407     case PIX_FMT_BGR8:
 408     case PIX_FMT_RGB8:
 409         return 8;
 410     case PIX_FMT_BGR4:
 411     case PIX_FMT_RGB4:
 412     case PIX_FMT_BGR4_BYTE:
 413     case PIX_FMT_RGB4_BYTE:
 414         return 4;
 415     case PIX_FMT_MONOBLACK:
 416     case PIX_FMT_MONOWHITE:
 417         return 1;
 418     default:
 419         return 0;
 420     }
 421 }
 422
 423 extern const uint64_t ff_dither4[2];
 424 extern const uint64_t ff_dither8[2];
 425
 426 extern const AVClass sws_context_class;
 427
 428 #endif /* SWSCALE_SWSCALE_INTERNAL_H */