2 * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
4 * This file is part of Libav.
6 * Libav is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * Libav is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with Libav; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
28 #include "swscale_internal.h"
30 #include "libavutil/intreadwrite.h"
31 #include "libavutil/cpu.h"
32 #include "libavutil/avutil.h"
33 #include "libavutil/mathematics.h"
34 #include "libavutil/bswap.h"
35 #include "libavutil/pixdesc.h"
37 DECLARE_ALIGNED(8, const uint8_t, dither_8x8_1)[8][8] = {
38 { 0, 1, 0, 1, 0, 1, 0, 1,},
39 { 1, 0, 1, 0, 1, 0, 1, 0,},
40 { 0, 1, 0, 1, 0, 1, 0, 1,},
41 { 1, 0, 1, 0, 1, 0, 1, 0,},
42 { 0, 1, 0, 1, 0, 1, 0, 1,},
43 { 1, 0, 1, 0, 1, 0, 1, 0,},
44 { 0, 1, 0, 1, 0, 1, 0, 1,},
45 { 1, 0, 1, 0, 1, 0, 1, 0,},
47 DECLARE_ALIGNED(8, const uint8_t, dither_8x8_3)[8][8] = {
48 { 1, 2, 1, 2, 1, 2, 1, 2,},
49 { 3, 0, 3, 0, 3, 0, 3, 0,},
50 { 1, 2, 1, 2, 1, 2, 1, 2,},
51 { 3, 0, 3, 0, 3, 0, 3, 0,},
52 { 1, 2, 1, 2, 1, 2, 1, 2,},
53 { 3, 0, 3, 0, 3, 0, 3, 0,},
54 { 1, 2, 1, 2, 1, 2, 1, 2,},
55 { 3, 0, 3, 0, 3, 0, 3, 0,},
57 DECLARE_ALIGNED(8, const uint8_t, dither_8x8_64)[8][8] = {
58 { 18, 34, 30, 46, 17, 33, 29, 45,},
59 { 50, 2, 62, 14, 49, 1, 61, 13,},
60 { 26, 42, 22, 38, 25, 41, 21, 37,},
61 { 58, 10, 54, 6, 57, 9, 53, 5,},
62 { 16, 32, 28, 44, 19, 35, 31, 47,},
63 { 48, 0, 60, 12, 51, 3, 63, 15,},
64 { 24, 40, 20, 36, 27, 43, 23, 39,},
65 { 56, 8, 52, 4, 59, 11, 55, 7,},
67 extern const uint8_t dither_8x8_128[8][8];
68 DECLARE_ALIGNED(8, const uint8_t, dither_8x8_256)[8][8] = {
69 { 72, 136, 120, 184, 68, 132, 116, 180,},
70 { 200, 8, 248, 56, 196, 4, 244, 52,},
71 { 104, 168, 88, 152, 100, 164, 84, 148,},
72 { 232, 40, 216, 24, 228, 36, 212, 20,},
73 { 64, 128, 102, 176, 76, 140, 124, 188,},
74 { 192, 0, 240, 48, 204, 12, 252, 60,},
75 { 96, 160, 80, 144, 108, 172, 92, 156,},
76 { 224, 32, 208, 16, 236, 44, 220, 28,},
79 #define RGB2YUV_SHIFT 15
80 #define BY ( (int) (0.114 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
81 #define BV (-(int) (0.081 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
82 #define BU ( (int) (0.500 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
83 #define GY ( (int) (0.587 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
84 #define GV (-(int) (0.419 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
85 #define GU (-(int) (0.331 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
86 #define RY ( (int) (0.299 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
87 #define RV ( (int) (0.500 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
88 #define RU (-(int) (0.169 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
/**
 * Set a block of rows in a plane to a constant byte value.
 *
 * @param plane  start of the plane
 * @param stride distance in bytes between consecutive rows
 * @param width  number of bytes written in each row
 * @param height number of rows written
 * @param y      index of the first row written
 * @param val    byte value stored
 */
static void fillPlane(uint8_t *plane, int stride, int width, int height, int y,
                      uint8_t val)
{
    uint8_t *row = plane + stride * y;
    int rows_left;

    for (rows_left = height; rows_left > 0; rows_left--) {
        memset(row, val, width);
        row += stride;
    }
}
/**
 * Copy srcSliceH rows from src into dst, starting at destination row
 * srcSliceY.
 *
 * When both strides are equal and positive the rows are contiguous on both
 * sides and a single memcpy() of srcSliceH * dstStride bytes is used;
 * otherwise each row is copied separately, width bytes at a time.
 */
static void copyPlane(const uint8_t *src, int srcStride,
                      int srcSliceY, int srcSliceH, int width,
                      uint8_t *dst, int dstStride)
{
    int row;

    dst += dstStride * srcSliceY;

    if (dstStride == srcStride && srcStride > 0) {
        memcpy(dst, src, srcSliceH * dstStride);
        return;
    }

    for (row = 0; row < srcSliceH; row++) {
        memcpy(dst, src, width);
        src += srcStride;
        dst += dstStride;
    }
}
118 static int planarToNv12Wrapper(SwsContext *c, const uint8_t *src[],
119 int srcStride[], int srcSliceY,
120 int srcSliceH, uint8_t *dstParam[],
123 uint8_t *dst = dstParam[1] + dstStride[1] * srcSliceY / 2;
125 copyPlane(src[0], srcStride[0], srcSliceY, srcSliceH, c->srcW,
126 dstParam[0], dstStride[0]);
128 if (c->dstFormat == PIX_FMT_NV12)
129 interleaveBytes(src[1], src[2], dst, c->srcW / 2, srcSliceH / 2,
130 srcStride[1], srcStride[2], dstStride[0]);
132 interleaveBytes(src[2], src[1], dst, c->srcW / 2, srcSliceH / 2,
133 srcStride[2], srcStride[1], dstStride[0]);
138 static int planarToYuy2Wrapper(SwsContext *c, const uint8_t *src[],
139 int srcStride[], int srcSliceY, int srcSliceH,
140 uint8_t *dstParam[], int dstStride[])
142 uint8_t *dst = dstParam[0] + dstStride[0] * srcSliceY;
144 yv12toyuy2(src[0], src[1], src[2], dst, c->srcW, srcSliceH, srcStride[0],
145 srcStride[1], dstStride[0]);
150 static int planarToUyvyWrapper(SwsContext *c, const uint8_t *src[],
151 int srcStride[], int srcSliceY, int srcSliceH,
152 uint8_t *dstParam[], int dstStride[])
154 uint8_t *dst = dstParam[0] + dstStride[0] * srcSliceY;
156 yv12touyvy(src[0], src[1], src[2], dst, c->srcW, srcSliceH, srcStride[0],
157 srcStride[1], dstStride[0]);
162 static int yuv422pToYuy2Wrapper(SwsContext *c, const uint8_t *src[],
163 int srcStride[], int srcSliceY, int srcSliceH,
164 uint8_t *dstParam[], int dstStride[])
166 uint8_t *dst = dstParam[0] + dstStride[0] * srcSliceY;
168 yuv422ptoyuy2(src[0], src[1], src[2], dst, c->srcW, srcSliceH, srcStride[0],
169 srcStride[1], dstStride[0]);
174 static int yuv422pToUyvyWrapper(SwsContext *c, const uint8_t *src[],
175 int srcStride[], int srcSliceY, int srcSliceH,
176 uint8_t *dstParam[], int dstStride[])
178 uint8_t *dst = dstParam[0] + dstStride[0] * srcSliceY;
180 yuv422ptouyvy(src[0], src[1], src[2], dst, c->srcW, srcSliceH, srcStride[0],
181 srcStride[1], dstStride[0]);
186 static int yuyvToYuv420Wrapper(SwsContext *c, const uint8_t *src[],
187 int srcStride[], int srcSliceY, int srcSliceH,
188 uint8_t *dstParam[], int dstStride[])
190 uint8_t *ydst = dstParam[0] + dstStride[0] * srcSliceY;
191 uint8_t *udst = dstParam[1] + dstStride[1] * srcSliceY / 2;
192 uint8_t *vdst = dstParam[2] + dstStride[2] * srcSliceY / 2;
194 yuyvtoyuv420(ydst, udst, vdst, src[0], c->srcW, srcSliceH, dstStride[0],
195 dstStride[1], srcStride[0]);
198 fillPlane(dstParam[3], dstStride[3], c->srcW, srcSliceH, srcSliceY, 255);
203 static int yuyvToYuv422Wrapper(SwsContext *c, const uint8_t *src[],
204 int srcStride[], int srcSliceY, int srcSliceH,
205 uint8_t *dstParam[], int dstStride[])
207 uint8_t *ydst = dstParam[0] + dstStride[0] * srcSliceY;
208 uint8_t *udst = dstParam[1] + dstStride[1] * srcSliceY;
209 uint8_t *vdst = dstParam[2] + dstStride[2] * srcSliceY;
211 yuyvtoyuv422(ydst, udst, vdst, src[0], c->srcW, srcSliceH, dstStride[0],
212 dstStride[1], srcStride[0]);
217 static int uyvyToYuv420Wrapper(SwsContext *c, const uint8_t *src[],
218 int srcStride[], int srcSliceY, int srcSliceH,
219 uint8_t *dstParam[], int dstStride[])
221 uint8_t *ydst = dstParam[0] + dstStride[0] * srcSliceY;
222 uint8_t *udst = dstParam[1] + dstStride[1] * srcSliceY / 2;
223 uint8_t *vdst = dstParam[2] + dstStride[2] * srcSliceY / 2;
225 uyvytoyuv420(ydst, udst, vdst, src[0], c->srcW, srcSliceH, dstStride[0],
226 dstStride[1], srcStride[0]);
229 fillPlane(dstParam[3], dstStride[3], c->srcW, srcSliceH, srcSliceY, 255);
234 static int uyvyToYuv422Wrapper(SwsContext *c, const uint8_t *src[],
235 int srcStride[], int srcSliceY, int srcSliceH,
236 uint8_t *dstParam[], int dstStride[])
238 uint8_t *ydst = dstParam[0] + dstStride[0] * srcSliceY;
239 uint8_t *udst = dstParam[1] + dstStride[1] * srcSliceY;
240 uint8_t *vdst = dstParam[2] + dstStride[2] * srcSliceY;
242 uyvytoyuv422(ydst, udst, vdst, src[0], c->srcW, srcSliceH, dstStride[0],
243 dstStride[1], srcStride[0]);
/**
 * Expand 2-byte (value, alpha) pixels to packed 32-bit pixels.
 *
 * The first byte of each pair indexes a table of 32-bit palette entries;
 * the second byte is OR-ed into bits 24..31 of the result.
 *
 * @param src        input, 2 bytes per pixel
 * @param dst        output, written as uint32_t per pixel
 * @param num_pixels number of pixels to convert
 * @param palette    256 entries read as uint32_t
 */
static void gray8aToPacked32(const uint8_t *src, uint8_t *dst, int num_pixels,
                             const uint8_t *palette)
{
    int i;

    for (i = 0; i < num_pixels; i++) {
        /* Widen before shifting: a uint8_t promotes to int, and shifting a
         * value >= 128 left by 24 overflows a 32-bit signed int. */
        const uint32_t alpha = src[(i << 1) + 1];

        ((uint32_t *) dst)[i] = ((const uint32_t *) palette)[src[i << 1]] | (alpha << 24);
    }
}
/**
 * Expand 2-byte (value, alpha) pixels to packed 32-bit pixels with the
 * second byte OR-ed into the lowest 8 bits of the palette entry.
 *
 * @param src        input, 2 bytes per pixel
 * @param dst        output, written as uint32_t per pixel
 * @param num_pixels number of pixels to convert
 * @param palette    256 entries read as uint32_t
 */
static void gray8aToPacked32_1(const uint8_t *src, uint8_t *dst, int num_pixels,
                               const uint8_t *palette)
{
    const uint32_t *lut = (const uint32_t *) palette;
    uint32_t       *out = (uint32_t *) dst;
    int px;

    for (px = 0; px < num_pixels; px++) {
        const uint8_t value = src[2 * px];
        const uint8_t alpha = src[2 * px + 1];

        out[px] = lut[value] | alpha;
    }
}
/**
 * Expand 2-byte pixels to packed 24-bit pixels.
 *
 * The first byte of each input pair selects a 4-byte palette entry whose
 * first three bytes are copied to the output; the second input byte is
 * not read.
 *
 * @param src        input, 2 bytes per pixel
 * @param dst        output, 3 bytes per pixel
 * @param num_pixels number of pixels to convert
 * @param palette    table of 4-byte entries
 */
static void gray8aToPacked24(const uint8_t *src, uint8_t *dst, int num_pixels,
                             const uint8_t *palette)
{
    int px;

    for (px = 0; px < num_pixels; px++, dst += 3) {
        const uint8_t *entry = palette + src[2 * px] * 4;

        dst[0] = entry[0];
        dst[1] = entry[1];
        dst[2] = entry[2];
    }
}
279 static int packed_16bpc_bswap(SwsContext *c, const uint8_t *src[],
280 int srcStride[], int srcSliceY, int srcSliceH,
281 uint8_t *dst[], int dstStride[])
284 int srcstr = srcStride[0] >> 1;
285 int dststr = dstStride[0] >> 1;
286 uint16_t *dstPtr = (uint16_t *) dst[0];
287 const uint16_t *srcPtr = (const uint16_t *) src[0];
288 int min_stride = FFMIN(srcstr, dststr);
290 for (i = 0; i < srcSliceH; i++) {
291 for (j = 0; j < min_stride; j++) {
292 dstPtr[j] = av_bswap16(srcPtr[j]);
301 static int palToRgbWrapper(SwsContext *c, const uint8_t *src[], int srcStride[],
302 int srcSliceY, int srcSliceH, uint8_t *dst[],
305 const enum PixelFormat srcFormat = c->srcFormat;
306 const enum PixelFormat dstFormat = c->dstFormat;
307 void (*conv)(const uint8_t *src, uint8_t *dst, int num_pixels,
308 const uint8_t *palette) = NULL;
310 uint8_t *dstPtr = dst[0] + dstStride[0] * srcSliceY;
311 const uint8_t *srcPtr = src[0];
313 if (srcFormat == PIX_FMT_Y400A) {
315 case PIX_FMT_RGB32 : conv = gray8aToPacked32; break;
316 case PIX_FMT_BGR32 : conv = gray8aToPacked32; break;
317 case PIX_FMT_BGR32_1: conv = gray8aToPacked32_1; break;
318 case PIX_FMT_RGB32_1: conv = gray8aToPacked32_1; break;
319 case PIX_FMT_RGB24 : conv = gray8aToPacked24; break;
320 case PIX_FMT_BGR24 : conv = gray8aToPacked24; break;
322 } else if (usePal(srcFormat)) {
324 case PIX_FMT_RGB32 : conv = sws_convertPalette8ToPacked32; break;
325 case PIX_FMT_BGR32 : conv = sws_convertPalette8ToPacked32; break;
326 case PIX_FMT_BGR32_1: conv = sws_convertPalette8ToPacked32; break;
327 case PIX_FMT_RGB32_1: conv = sws_convertPalette8ToPacked32; break;
328 case PIX_FMT_RGB24 : conv = sws_convertPalette8ToPacked24; break;
329 case PIX_FMT_BGR24 : conv = sws_convertPalette8ToPacked24; break;
334 av_log(c, AV_LOG_ERROR, "internal error %s -> %s converter\n",
335 sws_format_name(srcFormat), sws_format_name(dstFormat));
337 for (i = 0; i < srcSliceH; i++) {
338 conv(srcPtr, dstPtr, c->srcW, (uint8_t *) c->pal_rgb);
339 srcPtr += srcStride[0];
340 dstPtr += dstStride[0];
347 #define isRGBA32(x) ( \
348 (x) == PIX_FMT_ARGB \
349 || (x) == PIX_FMT_RGBA \
350 || (x) == PIX_FMT_BGRA \
351 || (x) == PIX_FMT_ABGR \
354 /* {RGB,BGR}{15,16,24,32,32_1} -> {RGB,BGR}{15,16,24,32} */
355 static int rgbToRgbWrapper(SwsContext *c, const uint8_t *src[], int srcStride[],
356 int srcSliceY, int srcSliceH, uint8_t *dst[],
359 const enum PixelFormat srcFormat = c->srcFormat;
360 const enum PixelFormat dstFormat = c->dstFormat;
361 const int srcBpp = (c->srcFormatBpp + 7) >> 3;
362 const int dstBpp = (c->dstFormatBpp + 7) >> 3;
363 const int srcId = c->srcFormatBpp;
364 const int dstId = c->dstFormatBpp;
365 void (*conv)(const uint8_t *src, uint8_t *dst, int src_size) = NULL;
367 #define CONV_IS(src, dst) (srcFormat == PIX_FMT_##src && dstFormat == PIX_FMT_##dst)
369 if (isRGBA32(srcFormat) && isRGBA32(dstFormat)) {
370 if ( CONV_IS(ABGR, RGBA)
371 || CONV_IS(ARGB, BGRA)
372 || CONV_IS(BGRA, ARGB)
373 || CONV_IS(RGBA, ABGR)) conv = shuffle_bytes_3210;
374 else if (CONV_IS(ABGR, ARGB)
375 || CONV_IS(ARGB, ABGR)) conv = shuffle_bytes_0321;
376 else if (CONV_IS(ABGR, BGRA)
377 || CONV_IS(ARGB, RGBA)) conv = shuffle_bytes_1230;
378 else if (CONV_IS(BGRA, RGBA)
379 || CONV_IS(RGBA, BGRA)) conv = shuffle_bytes_2103;
380 else if (CONV_IS(BGRA, ABGR)
381 || CONV_IS(RGBA, ARGB)) conv = shuffle_bytes_3012;
384 if ((isBGRinInt(srcFormat) && isBGRinInt(dstFormat)) ||
385 (isRGBinInt(srcFormat) && isRGBinInt(dstFormat))) {
386 switch (srcId | (dstId << 16)) {
387 case 0x000F0010: conv = rgb16to15; break;
388 case 0x000F0018: conv = rgb24to15; break;
389 case 0x000F0020: conv = rgb32to15; break;
390 case 0x0010000F: conv = rgb15to16; break;
391 case 0x00100018: conv = rgb24to16; break;
392 case 0x00100020: conv = rgb32to16; break;
393 case 0x0018000F: conv = rgb15to24; break;
394 case 0x00180010: conv = rgb16to24; break;
395 case 0x00180020: conv = rgb32to24; break;
396 case 0x0020000F: conv = rgb15to32; break;
397 case 0x00200010: conv = rgb16to32; break;
398 case 0x00200018: conv = rgb24to32; break;
400 } else if ((isBGRinInt(srcFormat) && isRGBinInt(dstFormat)) ||
401 (isRGBinInt(srcFormat) && isBGRinInt(dstFormat))) {
402 switch (srcId | (dstId << 16)) {
403 case 0x000C000C: conv = rgb12tobgr12; break;
404 case 0x000F000F: conv = rgb15tobgr15; break;
405 case 0x000F0010: conv = rgb16tobgr15; break;
406 case 0x000F0018: conv = rgb24tobgr15; break;
407 case 0x000F0020: conv = rgb32tobgr15; break;
408 case 0x0010000F: conv = rgb15tobgr16; break;
409 case 0x00100010: conv = rgb16tobgr16; break;
410 case 0x00100018: conv = rgb24tobgr16; break;
411 case 0x00100020: conv = rgb32tobgr16; break;
412 case 0x0018000F: conv = rgb15tobgr24; break;
413 case 0x00180010: conv = rgb16tobgr24; break;
414 case 0x00180018: conv = rgb24tobgr24; break;
415 case 0x00180020: conv = rgb32tobgr24; break;
416 case 0x0020000F: conv = rgb15tobgr32; break;
417 case 0x00200010: conv = rgb16tobgr32; break;
418 case 0x00200018: conv = rgb24tobgr32; break;
423 av_log(c, AV_LOG_ERROR, "internal error %s -> %s converter\n",
424 sws_format_name(srcFormat), sws_format_name(dstFormat));
426 const uint8_t *srcPtr = src[0];
427 uint8_t *dstPtr = dst[0];
428 if ((srcFormat == PIX_FMT_RGB32_1 || srcFormat == PIX_FMT_BGR32_1) &&
429 !isRGBA32(dstFormat))
430 srcPtr += ALT32_CORR;
432 if ((dstFormat == PIX_FMT_RGB32_1 || dstFormat == PIX_FMT_BGR32_1) &&
433 !isRGBA32(srcFormat))
434 dstPtr += ALT32_CORR;
436 if (dstStride[0] * srcBpp == srcStride[0] * dstBpp && srcStride[0] > 0 &&
437 !(srcStride[0] % srcBpp))
438 conv(srcPtr, dstPtr + dstStride[0] * srcSliceY,
439 srcSliceH * srcStride[0]);
442 dstPtr += dstStride[0] * srcSliceY;
444 for (i = 0; i < srcSliceH; i++) {
445 conv(srcPtr, dstPtr, c->srcW * srcBpp);
446 srcPtr += srcStride[0];
447 dstPtr += dstStride[0];
454 static int bgr24ToYv12Wrapper(SwsContext *c, const uint8_t *src[],
455 int srcStride[], int srcSliceY, int srcSliceH,
456 uint8_t *dst[], int dstStride[])
460 dst[0] + srcSliceY * dstStride[0],
461 dst[1] + (srcSliceY >> 1) * dstStride[1],
462 dst[2] + (srcSliceY >> 1) * dstStride[2],
464 dstStride[0], dstStride[1], srcStride[0]);
466 fillPlane(dst[3], dstStride[3], c->srcW, srcSliceH, srcSliceY, 255);
470 static int yvu9ToYv12Wrapper(SwsContext *c, const uint8_t *src[],
471 int srcStride[], int srcSliceY, int srcSliceH,
472 uint8_t *dst[], int dstStride[])
474 copyPlane(src[0], srcStride[0], srcSliceY, srcSliceH, c->srcW,
475 dst[0], dstStride[0]);
477 planar2x(src[1], dst[1] + dstStride[1] * (srcSliceY >> 1), c->chrSrcW,
478 srcSliceH >> 2, srcStride[1], dstStride[1]);
479 planar2x(src[2], dst[2] + dstStride[2] * (srcSliceY >> 1), c->chrSrcW,
480 srcSliceH >> 2, srcStride[2], dstStride[2]);
482 fillPlane(dst[3], dstStride[3], c->srcW, srcSliceH, srcSliceY, 255);
486 /* unscaled copy like stuff (assumes nearly identical formats) */
487 static int packedCopyWrapper(SwsContext *c, const uint8_t *src[],
488 int srcStride[], int srcSliceY, int srcSliceH,
489 uint8_t *dst[], int dstStride[])
491 if (dstStride[0] == srcStride[0] && srcStride[0] > 0)
492 memcpy(dst[0] + dstStride[0] * srcSliceY, src[0], srcSliceH * dstStride[0]);
495 const uint8_t *srcPtr = src[0];
496 uint8_t *dstPtr = dst[0] + dstStride[0] * srcSliceY;
499 /* universal length finder */
500 while (length + c->srcW <= FFABS(dstStride[0]) &&
501 length + c->srcW <= FFABS(srcStride[0]))
505 for (i = 0; i < srcSliceH; i++) {
506 memcpy(dstPtr, srcPtr, length);
507 srcPtr += srcStride[0];
508 dstPtr += dstStride[0];
514 #define clip9(x) av_clip_uintp2(x, 9)
515 #define clip10(x) av_clip_uintp2(x, 10)
/*
 * Copy `height` rows of `length` samples from src to dst, adding an 8x8
 * ordered-dither offset to each sample before shifting it right by `shift`.
 *
 * Expects `i`, `j`, `height` and `length` to be declared by the caller;
 * `dst` and `src` are advanced by their strides after every row.
 * rfunc reads one source sample, wfunc stores one destination sample and
 * clip bounds the shifted value to the destination range.
 *
 * The main loop handles 8 samples per iteration; the tail loop handles the
 * remaining length % 8 samples and now applies `clip` as well, so that a
 * sample near full scale plus its dither offset cannot wrap around when
 * stored (e.g. 16 -> 8 bit: (65535 + 252) >> 8 == 257).
 */
#define DITHER_COPY(dst, dstStride, wfunc, src, srcStride, rfunc, dithers, shift, clip) \
    for (i = 0; i < height; i++) { \
        const uint8_t *dither = dithers[i & 7]; \
        for (j = 0; j < length - 7; j += 8) { \
            wfunc(&dst[j + 0], clip((rfunc(&src[j + 0]) + dither[0]) >> shift)); \
            wfunc(&dst[j + 1], clip((rfunc(&src[j + 1]) + dither[1]) >> shift)); \
            wfunc(&dst[j + 2], clip((rfunc(&src[j + 2]) + dither[2]) >> shift)); \
            wfunc(&dst[j + 3], clip((rfunc(&src[j + 3]) + dither[3]) >> shift)); \
            wfunc(&dst[j + 4], clip((rfunc(&src[j + 4]) + dither[4]) >> shift)); \
            wfunc(&dst[j + 5], clip((rfunc(&src[j + 5]) + dither[5]) >> shift)); \
            wfunc(&dst[j + 6], clip((rfunc(&src[j + 6]) + dither[6]) >> shift)); \
            wfunc(&dst[j + 7], clip((rfunc(&src[j + 7]) + dither[7]) >> shift)); \
        } \
        for (; j < length; j++) \
            wfunc(&dst[j], clip((rfunc(&src[j]) + dither[j & 7]) >> shift)); \
        dst += dstStride; \
        src += srcStride; \
    }
535 static int planarCopyWrapper(SwsContext *c, const uint8_t *src[],
536 int srcStride[], int srcSliceY, int srcSliceH,
537 uint8_t *dst[], int dstStride[])
540 for (plane = 0; plane < 4; plane++) {
541 int length = (plane == 0 || plane == 3) ? c->srcW : -((-c->srcW ) >> c->chrDstHSubSample);
542 int y = (plane == 0 || plane == 3) ? srcSliceY: -((-srcSliceY) >> c->chrDstVSubSample);
543 int height = (plane == 0 || plane == 3) ? srcSliceH: -((-srcSliceH) >> c->chrDstVSubSample);
544 const uint8_t *srcPtr = src[plane];
545 uint8_t *dstPtr = dst[plane] + dstStride[plane] * y;
549 // ignore palette for GRAY8
550 if (plane == 1 && !dst[2]) continue;
551 if (!src[plane] || (plane == 1 && !src[2])) {
552 if (is16BPS(c->dstFormat))
554 fillPlane(dst[plane], dstStride[plane], length, height, y,
555 (plane == 3) ? 255 : 128);
557 if (is9_OR_10BPS(c->srcFormat)) {
558 const int src_depth = av_pix_fmt_descriptors[c->srcFormat].comp[plane].depth_minus1 + 1;
559 const int dst_depth = av_pix_fmt_descriptors[c->dstFormat].comp[plane].depth_minus1 + 1;
560 const uint16_t *srcPtr2 = (const uint16_t *) srcPtr;
562 if (is16BPS(c->dstFormat)) {
563 uint16_t *dstPtr2 = (uint16_t *) dstPtr;
564 #define COPY9_OR_10TO16(rfunc, wfunc) \
565 for (i = 0; i < height; i++) { \
566 for (j = 0; j < length; j++) { \
567 int srcpx = rfunc(&srcPtr2[j]); \
568 wfunc(&dstPtr2[j], (srcpx << (16 - src_depth)) | (srcpx >> (2 * src_depth - 16))); \
570 dstPtr2 += dstStride[plane] / 2; \
571 srcPtr2 += srcStride[plane] / 2; \
573 if (isBE(c->dstFormat)) {
574 if (isBE(c->srcFormat)) {
575 COPY9_OR_10TO16(AV_RB16, AV_WB16);
577 COPY9_OR_10TO16(AV_RL16, AV_WB16);
580 if (isBE(c->srcFormat)) {
581 COPY9_OR_10TO16(AV_RB16, AV_WL16);
583 COPY9_OR_10TO16(AV_RL16, AV_WL16);
586 } else if (is9_OR_10BPS(c->dstFormat)) {
587 uint16_t *dstPtr2 = (uint16_t *) dstPtr;
588 #define COPY9_OR_10TO9_OR_10(loop) \
589 for (i = 0; i < height; i++) { \
590 for (j = 0; j < length; j++) { \
593 dstPtr2 += dstStride[plane] / 2; \
594 srcPtr2 += srcStride[plane] / 2; \
596 #define COPY9_OR_10TO9_OR_10_2(rfunc, wfunc) \
597 if (dst_depth > src_depth) { \
598 COPY9_OR_10TO9_OR_10(int srcpx = rfunc(&srcPtr2[j]); \
599 wfunc(&dstPtr2[j], (srcpx << 1) | (srcpx >> 9))); \
600 } else if (dst_depth < src_depth) { \
601 DITHER_COPY(dstPtr2, dstStride[plane] / 2, wfunc, \
602 srcPtr2, srcStride[plane] / 2, rfunc, \
603 dither_8x8_1, 1, clip9); \
605 COPY9_OR_10TO9_OR_10(wfunc(&dstPtr2[j], rfunc(&srcPtr2[j]))); \
607 if (isBE(c->dstFormat)) {
608 if (isBE(c->srcFormat)) {
609 COPY9_OR_10TO9_OR_10_2(AV_RB16, AV_WB16);
611 COPY9_OR_10TO9_OR_10_2(AV_RL16, AV_WB16);
614 if (isBE(c->srcFormat)) {
615 COPY9_OR_10TO9_OR_10_2(AV_RB16, AV_WL16);
617 COPY9_OR_10TO9_OR_10_2(AV_RL16, AV_WL16);
621 #define W8(a, b) { *(a) = (b); }
622 #define COPY9_OR_10TO8(rfunc) \
623 if (src_depth == 9) { \
624 DITHER_COPY(dstPtr, dstStride[plane], W8, \
625 srcPtr2, srcStride[plane] / 2, rfunc, \
626 dither_8x8_1, 1, av_clip_uint8); \
628 DITHER_COPY(dstPtr, dstStride[plane], W8, \
629 srcPtr2, srcStride[plane] / 2, rfunc, \
630 dither_8x8_3, 2, av_clip_uint8); \
632 if (isBE(c->srcFormat)) {
633 COPY9_OR_10TO8(AV_RB16);
635 COPY9_OR_10TO8(AV_RL16);
638 } else if (is9_OR_10BPS(c->dstFormat)) {
639 const int dst_depth = av_pix_fmt_descriptors[c->dstFormat].comp[plane].depth_minus1 + 1;
640 uint16_t *dstPtr2 = (uint16_t *) dstPtr;
642 if (is16BPS(c->srcFormat)) {
643 const uint16_t *srcPtr2 = (const uint16_t *) srcPtr;
644 #define COPY16TO9_OR_10(rfunc, wfunc) \
645 if (dst_depth == 9) { \
646 DITHER_COPY(dstPtr2, dstStride[plane] / 2, wfunc, \
647 srcPtr2, srcStride[plane] / 2, rfunc, \
648 dither_8x8_128, 7, clip9); \
650 DITHER_COPY(dstPtr2, dstStride[plane] / 2, wfunc, \
651 srcPtr2, srcStride[plane] / 2, rfunc, \
652 dither_8x8_64, 6, clip10); \
654 if (isBE(c->dstFormat)) {
655 if (isBE(c->srcFormat)) {
656 COPY16TO9_OR_10(AV_RB16, AV_WB16);
658 COPY16TO9_OR_10(AV_RL16, AV_WB16);
661 if (isBE(c->srcFormat)) {
662 COPY16TO9_OR_10(AV_RB16, AV_WL16);
664 COPY16TO9_OR_10(AV_RL16, AV_WL16);
668 #define COPY8TO9_OR_10(wfunc) \
669 for (i = 0; i < height; i++) { \
670 for (j = 0; j < length; j++) { \
671 const int srcpx = srcPtr[j]; \
672 wfunc(&dstPtr2[j], (srcpx << (dst_depth - 8)) | (srcpx >> (16 - dst_depth))); \
674 dstPtr2 += dstStride[plane] / 2; \
675 srcPtr += srcStride[plane]; \
677 if (isBE(c->dstFormat)) {
678 COPY8TO9_OR_10(AV_WB16);
680 COPY8TO9_OR_10(AV_WL16);
683 } else if (is16BPS(c->srcFormat) && !is16BPS(c->dstFormat)) {
684 const uint16_t *srcPtr2 = (const uint16_t *) srcPtr;
685 #define COPY16TO8(rfunc) \
686 DITHER_COPY(dstPtr, dstStride[plane], W8, \
687 srcPtr2, srcStride[plane] / 2, rfunc, \
688 dither_8x8_256, 8, av_clip_uint8);
689 if (isBE(c->srcFormat)) {
694 } else if (!is16BPS(c->srcFormat) && is16BPS(c->dstFormat)) {
695 for (i = 0; i < height; i++) {
696 for (j = 0; j < length; j++) {
697 dstPtr[ j << 1 ] = srcPtr[j];
698 dstPtr[(j << 1) + 1] = srcPtr[j];
700 srcPtr += srcStride[plane];
701 dstPtr += dstStride[plane];
703 } else if (is16BPS(c->srcFormat) && is16BPS(c->dstFormat) &&
704 isBE(c->srcFormat) != isBE(c->dstFormat)) {
706 for (i = 0; i < height; i++) {
707 for (j = 0; j < length; j++)
708 ((uint16_t *) dstPtr)[j] = av_bswap16(((const uint16_t *) srcPtr)[j]);
709 srcPtr += srcStride[plane];
710 dstPtr += dstStride[plane];
712 } else if (dstStride[plane] == srcStride[plane] &&
713 srcStride[plane] > 0 && srcStride[plane] == length) {
714 memcpy(dst[plane] + dstStride[plane] * y, src[plane],
715 height * dstStride[plane]);
717 if (is16BPS(c->srcFormat) && is16BPS(c->dstFormat))
719 for (i = 0; i < height; i++) {
720 memcpy(dstPtr, srcPtr, length);
721 srcPtr += srcStride[plane];
722 dstPtr += dstStride[plane];
/*
 * True when src_fmt and dst_fmt are the big- and little-endian variants
 * (in either order) of the format family named by pix_fmt, i.e. the
 * constants pix_fmt##BE and pix_fmt##LE.
 * src_fmt and dst_fmt are parenthesized so that expression arguments
 * (e.g. a conditional expression) compare as a whole; each is evaluated
 * up to twice, so they must be free of side effects.
 */
#define IS_DIFFERENT_ENDIANESS(src_fmt, dst_fmt, pix_fmt)              \
    (((src_fmt) == pix_fmt ## BE && (dst_fmt) == pix_fmt ## LE) ||     \
     ((src_fmt) == pix_fmt ## LE && (dst_fmt) == pix_fmt ## BE))
736 void ff_get_unscaled_swscale(SwsContext *c)
738 const enum PixelFormat srcFormat = c->srcFormat;
739 const enum PixelFormat dstFormat = c->dstFormat;
740 const int flags = c->flags;
741 const int dstH = c->dstH;
744 needsDither = isAnyRGB(dstFormat) &&
745 c->dstFormatBpp < 24 &&
746 (c->dstFormatBpp < c->srcFormatBpp || (!isAnyRGB(srcFormat)));
749 if ((srcFormat == PIX_FMT_YUV420P || srcFormat == PIX_FMT_YUVA420P) &&
750 (dstFormat == PIX_FMT_NV12 || dstFormat == PIX_FMT_NV21)) {
751 c->swScale = planarToNv12Wrapper;
754 if ((srcFormat == PIX_FMT_YUV420P || srcFormat == PIX_FMT_YUV422P ||
755 srcFormat == PIX_FMT_YUVA420P) && isAnyRGB(dstFormat) &&
756 !(flags & SWS_ACCURATE_RND) && !(dstH & 1)) {
757 c->swScale = ff_yuv2rgb_get_func_ptr(c);
760 if (srcFormat == PIX_FMT_YUV410P &&
761 (dstFormat == PIX_FMT_YUV420P || dstFormat == PIX_FMT_YUVA420P) &&
762 !(flags & SWS_BITEXACT)) {
763 c->swScale = yvu9ToYv12Wrapper;
767 if (srcFormat == PIX_FMT_BGR24 &&
768 (dstFormat == PIX_FMT_YUV420P || dstFormat == PIX_FMT_YUVA420P) &&
769 !(flags & SWS_ACCURATE_RND))
770 c->swScale = bgr24ToYv12Wrapper;
772 /* RGB/BGR -> RGB/BGR (no dither needed forms) */
773 if ( isAnyRGB(srcFormat)
774 && isAnyRGB(dstFormat)
775 && srcFormat != PIX_FMT_BGR8 && dstFormat != PIX_FMT_BGR8
776 && srcFormat != PIX_FMT_RGB8 && dstFormat != PIX_FMT_RGB8
777 && srcFormat != PIX_FMT_BGR4 && dstFormat != PIX_FMT_BGR4
778 && srcFormat != PIX_FMT_RGB4 && dstFormat != PIX_FMT_RGB4
779 && srcFormat != PIX_FMT_BGR4_BYTE && dstFormat != PIX_FMT_BGR4_BYTE
780 && srcFormat != PIX_FMT_RGB4_BYTE && dstFormat != PIX_FMT_RGB4_BYTE
781 && srcFormat != PIX_FMT_MONOBLACK && dstFormat != PIX_FMT_MONOBLACK
782 && srcFormat != PIX_FMT_MONOWHITE && dstFormat != PIX_FMT_MONOWHITE
783 && srcFormat != PIX_FMT_RGB48LE && dstFormat != PIX_FMT_RGB48LE
784 && srcFormat != PIX_FMT_RGB48BE && dstFormat != PIX_FMT_RGB48BE
785 && srcFormat != PIX_FMT_BGR48LE && dstFormat != PIX_FMT_BGR48LE
786 && srcFormat != PIX_FMT_BGR48BE && dstFormat != PIX_FMT_BGR48BE
787 && (!needsDither || (c->flags&(SWS_FAST_BILINEAR|SWS_POINT))))
788 c->swScale= rgbToRgbWrapper;
790 /* bswap 16 bits per pixel/component packed formats */
791 if (IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_BGR444) ||
792 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_BGR48) ||
793 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_BGR555) ||
794 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_BGR565) ||
795 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_GRAY16) ||
796 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_RGB444) ||
797 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_RGB48) ||
798 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_RGB555) ||
799 IS_DIFFERENT_ENDIANESS(srcFormat, dstFormat, PIX_FMT_RGB565))
800 c->swScale = packed_16bpc_bswap;
802 if ((usePal(srcFormat) && (
803 dstFormat == PIX_FMT_RGB32 ||
804 dstFormat == PIX_FMT_RGB32_1 ||
805 dstFormat == PIX_FMT_RGB24 ||
806 dstFormat == PIX_FMT_BGR32 ||
807 dstFormat == PIX_FMT_BGR32_1 ||
808 dstFormat == PIX_FMT_BGR24)))
809 c->swScale = palToRgbWrapper;
811 if (srcFormat == PIX_FMT_YUV422P) {
812 if (dstFormat == PIX_FMT_YUYV422)
813 c->swScale = yuv422pToYuy2Wrapper;
814 else if (dstFormat == PIX_FMT_UYVY422)
815 c->swScale = yuv422pToUyvyWrapper;
818 /* LQ converters if -sws 0 or -sws 4*/
819 if (c->flags&(SWS_FAST_BILINEAR|SWS_POINT)) {
821 if (srcFormat == PIX_FMT_YUV420P || srcFormat == PIX_FMT_YUVA420P) {
822 if (dstFormat == PIX_FMT_YUYV422)
823 c->swScale = planarToYuy2Wrapper;
824 else if (dstFormat == PIX_FMT_UYVY422)
825 c->swScale = planarToUyvyWrapper;
828 if (srcFormat == PIX_FMT_YUYV422 &&
829 (dstFormat == PIX_FMT_YUV420P || dstFormat == PIX_FMT_YUVA420P))
830 c->swScale = yuyvToYuv420Wrapper;
831 if (srcFormat == PIX_FMT_UYVY422 &&
832 (dstFormat == PIX_FMT_YUV420P || dstFormat == PIX_FMT_YUVA420P))
833 c->swScale = uyvyToYuv420Wrapper;
834 if (srcFormat == PIX_FMT_YUYV422 && dstFormat == PIX_FMT_YUV422P)
835 c->swScale = yuyvToYuv422Wrapper;
836 if (srcFormat == PIX_FMT_UYVY422 && dstFormat == PIX_FMT_YUV422P)
837 c->swScale = uyvyToYuv422Wrapper;
840 if ( srcFormat == dstFormat ||
841 (srcFormat == PIX_FMT_YUVA420P && dstFormat == PIX_FMT_YUV420P) ||
842 (srcFormat == PIX_FMT_YUV420P && dstFormat == PIX_FMT_YUVA420P) ||
843 (isPlanarYUV(srcFormat) && isGray(dstFormat)) ||
844 (isPlanarYUV(dstFormat) && isGray(srcFormat)) ||
845 (isGray(dstFormat) && isGray(srcFormat)) ||
846 (isPlanarYUV(srcFormat) && isPlanarYUV(dstFormat) &&
847 c->chrDstHSubSample == c->chrSrcHSubSample &&
848 c->chrDstVSubSample == c->chrSrcVSubSample &&
849 dstFormat != PIX_FMT_NV12 && dstFormat != PIX_FMT_NV21 &&
850 srcFormat != PIX_FMT_NV12 && srcFormat != PIX_FMT_NV21))
852 if (isPacked(c->srcFormat))
853 c->swScale = packedCopyWrapper;
854 else /* Planar YUV or gray */
855 c->swScale = planarCopyWrapper;
859 ff_bfin_get_unscaled_swscale(c);
861 ff_swscale_get_unscaled_altivec(c);
/**
 * Clear the plane pointers that the given pixel format does not use.
 *
 * - src[3] is cleared when the format has no alpha or is not planar;
 * - src[2] is cleared when the format is not planar;
 * - src[1] is cleared when the format is neither planar nor palettised.
 */
static void reset_ptr(const uint8_t *src[], int format)
{
    const int packed = !isPlanar(format);

    if (packed || !isALPHA(format))
        src[3] = NULL;

    if (packed) {
        src[2] = NULL;

        if (!usePal(format))
            src[1] = NULL;
    }
}
876 static int check_image_pointers(uint8_t *data[4], enum PixelFormat pix_fmt,
877 const int linesizes[4])
879 const AVPixFmtDescriptor *desc = &av_pix_fmt_descriptors[pix_fmt];
882 for (i = 0; i < 4; i++) {
883 int plane = desc->comp[i].plane;
884 if (!data[plane] || !linesizes[plane])
892 * swscale wrapper, so we don't need to export the SwsContext.
893 * Assumes planar YUV to be in YUV order instead of YVU.
895 int attribute_align_arg sws_scale(struct SwsContext *c,
896 const uint8_t * const srcSlice[],
897 const int srcStride[], int srcSliceY,
898 int srcSliceH, uint8_t *const dst[],
899 const int dstStride[])
902 const uint8_t *src2[4] = { srcSlice[0], srcSlice[1], srcSlice[2], srcSlice[3] };
903 uint8_t *dst2[4] = { dst[0], dst[1], dst[2], dst[3] };
905 // do not mess up sliceDir if we have a "trailing" 0-size slice
909 if (!check_image_pointers(srcSlice, c->srcFormat, srcStride)) {
910 av_log(c, AV_LOG_ERROR, "bad src image pointers\n");
913 if (!check_image_pointers(dst, c->dstFormat, dstStride)) {
914 av_log(c, AV_LOG_ERROR, "bad dst image pointers\n");
918 if (c->sliceDir == 0 && srcSliceY != 0 && srcSliceY + srcSliceH != c->srcH) {
919 av_log(c, AV_LOG_ERROR, "Slices start in the middle!\n");
922 if (c->sliceDir == 0) {
923 if (srcSliceY == 0) c->sliceDir = 1; else c->sliceDir = -1;
926 if (usePal(c->srcFormat)) {
927 for (i = 0; i < 256; i++) {
928 int p, r, g, b, y, u, v;
929 if (c->srcFormat == PIX_FMT_PAL8) {
930 p = ((const uint32_t *)(srcSlice[1]))[i];
931 r = (p >> 16) & 0xFF;
934 } else if (c->srcFormat == PIX_FMT_RGB8) {
936 g = ((i >> 2) & 7) * 36;
938 } else if (c->srcFormat == PIX_FMT_BGR8) {
940 g = ((i >> 3) & 7) * 36;
942 } else if (c->srcFormat == PIX_FMT_RGB4_BYTE) {
943 r = ( i >> 3 ) * 255;
944 g = ((i >> 1) & 3) * 85;
946 } else if (c->srcFormat == PIX_FMT_GRAY8 ||
947 c->srcFormat == PIX_FMT_Y400A) {
950 assert(c->srcFormat == PIX_FMT_BGR4_BYTE);
951 b = ( i >> 3 ) * 255;
952 g = ((i >> 1) & 3) * 85;
955 y = av_clip_uint8((RY * r + GY * g + BY * b + ( 33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
956 u = av_clip_uint8((RU * r + GU * g + BU * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
957 v = av_clip_uint8((RV * r + GV * g + BV * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
958 c->pal_yuv[i] = y + (u << 8) + (v << 16);
960 switch (c->dstFormat) {
965 c->pal_rgb[i] = r + (g << 8) + (b << 16);
967 case PIX_FMT_BGR32_1:
971 c->pal_rgb[i] = (r + (g << 8) + (b << 16)) << 8;
973 case PIX_FMT_RGB32_1:
977 c->pal_rgb[i] = (b + (g << 8) + (r << 16)) << 8;
984 c->pal_rgb[i] = b + (g << 8) + (r << 16);
989 // copy strides, so they can safely be modified
990 if (c->sliceDir == 1) {
991 // slices go from top to bottom
992 int srcStride2[4] = { srcStride[0], srcStride[1], srcStride[2],
994 int dstStride2[4] = { dstStride[0], dstStride[1], dstStride[2],
997 reset_ptr(src2, c->srcFormat);
998 reset_ptr((const uint8_t **) dst2, c->dstFormat);
1000 /* reset slice direction at end of frame */
1001 if (srcSliceY + srcSliceH == c->srcH)
1004 return c->swScale(c, src2, srcStride2, srcSliceY, srcSliceH, dst2,
1007 // slices go from bottom to top => we flip the image internally
1008 int srcStride2[4] = { -srcStride[0], -srcStride[1], -srcStride[2],
1010 int dstStride2[4] = { -dstStride[0], -dstStride[1], -dstStride[2],
1013 src2[0] += (srcSliceH - 1) * srcStride[0];
1014 if (!usePal(c->srcFormat))
1015 src2[1] += ((srcSliceH >> c->chrSrcVSubSample) - 1) * srcStride[1];
1016 src2[2] += ((srcSliceH >> c->chrSrcVSubSample) - 1) * srcStride[2];
1017 src2[3] += (srcSliceH - 1) * srcStride[3];
1018 dst2[0] += ( c->dstH - 1) * dstStride[0];
1019 dst2[1] += ((c->dstH >> c->chrDstVSubSample) - 1) * dstStride[1];
1020 dst2[2] += ((c->dstH >> c->chrDstVSubSample) - 1) * dstStride[2];
1021 dst2[3] += ( c->dstH - 1) * dstStride[3];
1023 reset_ptr(src2, c->srcFormat);
1024 reset_ptr((const uint8_t **) dst2, c->dstFormat);
1026 /* reset slice direction at end of frame */
1030 return c->swScale(c, src2, srcStride2, c->srcH-srcSliceY-srcSliceH,
1031 srcSliceH, dst2, dstStride2);
/* Convert 8-bit palette indices to packed 32-bit pixels; each output pixel
 * is the 32-bit palette entry selected by the index, copied unchanged. */
void sws_convertPalette8ToPacked32(const uint8_t *src, uint8_t *dst,
                                   int num_pixels, const uint8_t *palette)
{
    const uint32_t *lut = (const uint32_t *) palette;
    uint32_t       *out = (uint32_t *) dst;
    int px;

    for (px = 0; px < num_pixels; px++) {
        const uint8_t index = src[px];

        out[px] = lut[index];
    }
}
1045 /* Palette format: ABCD -> dst format: ABC */
1046 void sws_convertPalette8ToPacked24(const uint8_t *src, uint8_t *dst,
1047 int num_pixels, const uint8_t *palette)
1051 for (i = 0; i < num_pixels; i++) {
1053 dst[0] = palette[src[i] * 4 + 0];
1054 dst[1] = palette[src[i] * 4 + 1];
1055 dst[2] = palette[src[i] * 4 + 2];