2 * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
4 * This file is part of Libav.
6 * Libav is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * Libav is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with Libav; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
27 #include "libavutil/avutil.h"
28 #include "libavutil/bswap.h"
29 #include "libavutil/cpu.h"
30 #include "libavutil/intreadwrite.h"
31 #include "libavutil/mathematics.h"
32 #include "libavutil/pixdesc.h"
36 #include "swscale_internal.h"
38 #define RGB2YUV_SHIFT 15
39 #define BY ((int)(0.114 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
40 #define BV (-(int)(0.081 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
41 #define BU ((int)(0.500 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
42 #define GY ((int)(0.587 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
43 #define GV (-(int)(0.419 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
44 #define GU (-(int)(0.331 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
45 #define RY ((int)(0.299 * 219 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
46 #define RV ((int)(0.500 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
47 #define RU (-(int)(0.169 * 224 / 255 * (1 << RGB2YUV_SHIFT) + 0.5))
49 #define input_pixel(pos) (isBE(origin) ? AV_RB16(pos) : AV_RL16(pos))
51 #define r ((origin == PIX_FMT_BGR48BE || origin == PIX_FMT_BGR48LE) ? b_r : r_b)
52 #define b ((origin == PIX_FMT_BGR48BE || origin == PIX_FMT_BGR48LE) ? r_b : b_r)
54 static av_always_inline void rgb48ToY_c_template(uint16_t *dst,
55 const uint16_t *src, int width,
56 enum PixelFormat origin)
59 for (i = 0; i < width; i++) {
60 unsigned int r_b = input_pixel(&src[i * 3 + 0]);
61 unsigned int g = input_pixel(&src[i * 3 + 1]);
62 unsigned int b_r = input_pixel(&src[i * 3 + 2]);
64 dst[i] = (RY * r + GY * g + BY * b + (0x2001 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
68 static av_always_inline void rgb48ToUV_c_template(uint16_t *dstU,
73 enum PixelFormat origin)
77 for (i = 0; i < width; i++) {
78 int r_b = input_pixel(&src1[i * 3 + 0]);
79 int g = input_pixel(&src1[i * 3 + 1]);
80 int b_r = input_pixel(&src1[i * 3 + 2]);
82 dstU[i] = (RU * r + GU * g + BU * b + (0x10001 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
83 dstV[i] = (RV * r + GV * g + BV * b + (0x10001 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
87 static av_always_inline void rgb48ToUV_half_c_template(uint16_t *dstU,
92 enum PixelFormat origin)
96 for (i = 0; i < width; i++) {
97 int r_b = (input_pixel(&src1[6 * i + 0]) +
98 input_pixel(&src1[6 * i + 3]) + 1) >> 1;
99 int g = (input_pixel(&src1[6 * i + 1]) +
100 input_pixel(&src1[6 * i + 4]) + 1) >> 1;
101 int b_r = (input_pixel(&src1[6 * i + 2]) +
102 input_pixel(&src1[6 * i + 5]) + 1) >> 1;
104 dstU[i] = (RU * r + GU * g + BU * b + (0x10001 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
105 dstV[i] = (RV * r + GV * g + BV * b + (0x10001 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
113 #define rgb48funcs(pattern, BE_LE, origin) \
114 static void pattern ## 48 ## BE_LE ## ToY_c(uint8_t *_dst, \
115 const uint8_t *_src, \
119 const uint16_t *src = (const uint16_t *)_src; \
120 uint16_t *dst = (uint16_t *)_dst; \
121 rgb48ToY_c_template(dst, src, width, origin); \
124 static void pattern ## 48 ## BE_LE ## ToUV_c(uint8_t *_dstU, \
126 const uint8_t *_src1, \
127 const uint8_t *_src2, \
131 const uint16_t *src1 = (const uint16_t *)_src1, \
132 *src2 = (const uint16_t *)_src2; \
133 uint16_t *dstU = (uint16_t *)_dstU, \
134 *dstV = (uint16_t *)_dstV; \
135 rgb48ToUV_c_template(dstU, dstV, src1, src2, width, origin); \
138 static void pattern ## 48 ## BE_LE ## ToUV_half_c(uint8_t *_dstU, \
140 const uint8_t *_src1, \
141 const uint8_t *_src2, \
145 const uint16_t *src1 = (const uint16_t *)_src1, \
146 *src2 = (const uint16_t *)_src2; \
147 uint16_t *dstU = (uint16_t *)_dstU, \
148 *dstV = (uint16_t *)_dstV; \
149 rgb48ToUV_half_c_template(dstU, dstV, src1, src2, width, origin); \
152 rgb48funcs(rgb, LE, PIX_FMT_RGB48LE)
153 rgb48funcs(rgb, BE, PIX_FMT_RGB48BE)
154 rgb48funcs(bgr, LE, PIX_FMT_BGR48LE)
155 rgb48funcs(bgr, BE, PIX_FMT_BGR48BE)
157 #define input_pixel(i) ((origin == PIX_FMT_RGBA || \
158 origin == PIX_FMT_BGRA || \
159 origin == PIX_FMT_ARGB || \
160 origin == PIX_FMT_ABGR) \
161 ? AV_RN32A(&src[(i) * 4]) \
162 : (isBE(origin) ? AV_RB16(&src[(i) * 2]) \
163 : AV_RL16(&src[(i) * 2])))
165 static av_always_inline void rgb16_32ToY_c_template(uint8_t *dst,
168 enum PixelFormat origin,
171 int maskr, int maskg,
173 int gsh, int bsh, int S)
175 const int ry = RY << rsh, gy = GY << gsh, by = BY << bsh;
176 const unsigned rnd = 33u << (S - 1);
179 for (i = 0; i < width; i++) {
180 int px = input_pixel(i) >> shp;
181 int b = (px & maskb) >> shb;
182 int g = (px & maskg) >> shg;
183 int r = (px & maskr) >> shr;
185 dst[i] = (ry * r + gy * g + by * b + rnd) >> S;
189 static av_always_inline void rgb16_32ToUV_c_template(uint8_t *dstU,
193 enum PixelFormat origin,
196 int maskr, int maskg,
198 int gsh, int bsh, int S)
200 const int ru = RU << rsh, gu = GU << gsh, bu = BU << bsh,
201 rv = RV << rsh, gv = GV << gsh, bv = BV << bsh;
202 const unsigned rnd = 257u << (S - 1);
205 for (i = 0; i < width; i++) {
206 int px = input_pixel(i) >> shp;
207 int b = (px & maskb) >> shb;
208 int g = (px & maskg) >> shg;
209 int r = (px & maskr) >> shr;
211 dstU[i] = (ru * r + gu * g + bu * b + rnd) >> S;
212 dstV[i] = (rv * r + gv * g + bv * b + rnd) >> S;
216 static av_always_inline void rgb16_32ToUV_half_c_template(uint8_t *dstU,
220 enum PixelFormat origin,
223 int maskr, int maskg,
225 int gsh, int bsh, int S)
227 const int ru = RU << rsh, gu = GU << gsh, bu = BU << bsh,
228 rv = RV << rsh, gv = GV << gsh, bv = BV << bsh,
229 maskgx = ~(maskr | maskb);
230 const unsigned rnd = 257u << S;
236 for (i = 0; i < width; i++) {
237 int px0 = input_pixel(2 * i + 0) >> shp;
238 int px1 = input_pixel(2 * i + 1) >> shp;
239 int b, r, g = (px0 & maskgx) + (px1 & maskgx);
240 int rb = px0 + px1 - g;
242 b = (rb & maskb) >> shb;
244 origin == PIX_FMT_BGR565LE || origin == PIX_FMT_BGR565BE ||
245 origin == PIX_FMT_RGB565LE || origin == PIX_FMT_RGB565BE) {
248 g = (g & maskg) >> shg;
250 r = (rb & maskr) >> shr;
252 dstU[i] = (ru * r + gu * g + bu * b + rnd) >> (S + 1);
253 dstV[i] = (rv * r + gv * g + bv * b + rnd) >> (S + 1);
259 #define rgb16_32_wrapper(fmt, name, shr, shg, shb, shp, maskr, \
260 maskg, maskb, rsh, gsh, bsh, S) \
261 static void name ## ToY_c(uint8_t *dst, const uint8_t *src, \
262 int width, uint32_t *unused) \
264 rgb16_32ToY_c_template(dst, src, width, fmt, shr, shg, shb, shp, \
265 maskr, maskg, maskb, rsh, gsh, bsh, S); \
268 static void name ## ToUV_c(uint8_t *dstU, uint8_t *dstV, \
269 const uint8_t *src, const uint8_t *dummy, \
270 int width, uint32_t *unused) \
272 rgb16_32ToUV_c_template(dstU, dstV, src, width, fmt, \
273 shr, shg, shb, shp, \
274 maskr, maskg, maskb, rsh, gsh, bsh, S); \
277 static void name ## ToUV_half_c(uint8_t *dstU, uint8_t *dstV, \
278 const uint8_t *src, \
279 const uint8_t *dummy, \
280 int width, uint32_t *unused) \
282 rgb16_32ToUV_half_c_template(dstU, dstV, src, width, fmt, \
283 shr, shg, shb, shp, \
284 maskr, maskg, maskb, \
288 rgb16_32_wrapper(PIX_FMT_BGR32, bgr32, 16, 0, 0, 0, 0xFF0000, 0xFF00, 0x00FF, 8, 0, 8, RGB2YUV_SHIFT + 8)
289 rgb16_32_wrapper(PIX_FMT_BGR32_1, bgr321, 16, 0, 0, 8, 0xFF0000, 0xFF00, 0x00FF, 8, 0, 8, RGB2YUV_SHIFT + 8)
290 rgb16_32_wrapper(PIX_FMT_RGB32, rgb32, 0, 0, 16, 0, 0x00FF, 0xFF00, 0xFF0000, 8, 0, 8, RGB2YUV_SHIFT + 8)
291 rgb16_32_wrapper(PIX_FMT_RGB32_1, rgb321, 0, 0, 16, 8, 0x00FF, 0xFF00, 0xFF0000, 8, 0, 8, RGB2YUV_SHIFT + 8)
292 rgb16_32_wrapper(PIX_FMT_BGR565LE, bgr16le, 0, 0, 0, 0, 0x001F, 0x07E0, 0xF800, 11, 5, 0, RGB2YUV_SHIFT + 8)
293 rgb16_32_wrapper(PIX_FMT_BGR555LE, bgr15le, 0, 0, 0, 0, 0x001F, 0x03E0, 0x7C00, 10, 5, 0, RGB2YUV_SHIFT + 7)
294 rgb16_32_wrapper(PIX_FMT_BGR444LE, bgr12le, 0, 0, 0, 0, 0x000F, 0x00F0, 0x0F00, 8, 4, 0, RGB2YUV_SHIFT + 4)
295 rgb16_32_wrapper(PIX_FMT_RGB565LE, rgb16le, 0, 0, 0, 0, 0xF800, 0x07E0, 0x001F, 0, 5, 11, RGB2YUV_SHIFT + 8)
296 rgb16_32_wrapper(PIX_FMT_RGB555LE, rgb15le, 0, 0, 0, 0, 0x7C00, 0x03E0, 0x001F, 0, 5, 10, RGB2YUV_SHIFT + 7)
297 rgb16_32_wrapper(PIX_FMT_RGB444LE, rgb12le, 0, 0, 0, 0, 0x0F00, 0x00F0, 0x000F, 0, 4, 8, RGB2YUV_SHIFT + 4)
298 rgb16_32_wrapper(PIX_FMT_BGR565BE, bgr16be, 0, 0, 0, 0, 0x001F, 0x07E0, 0xF800, 11, 5, 0, RGB2YUV_SHIFT + 8)
299 rgb16_32_wrapper(PIX_FMT_BGR555BE, bgr15be, 0, 0, 0, 0, 0x001F, 0x03E0, 0x7C00, 10, 5, 0, RGB2YUV_SHIFT + 7)
300 rgb16_32_wrapper(PIX_FMT_BGR444BE, bgr12be, 0, 0, 0, 0, 0x000F, 0x00F0, 0x0F00, 8, 4, 0, RGB2YUV_SHIFT + 4)
301 rgb16_32_wrapper(PIX_FMT_RGB565BE, rgb16be, 0, 0, 0, 0, 0xF800, 0x07E0, 0x001F, 0, 5, 11, RGB2YUV_SHIFT + 8)
302 rgb16_32_wrapper(PIX_FMT_RGB555BE, rgb15be, 0, 0, 0, 0, 0x7C00, 0x03E0, 0x001F, 0, 5, 10, RGB2YUV_SHIFT + 7)
303 rgb16_32_wrapper(PIX_FMT_RGB444BE, rgb12be, 0, 0, 0, 0, 0x0F00, 0x00F0, 0x000F, 0, 4, 8, RGB2YUV_SHIFT + 4)
305 static void abgrToA_c(uint8_t *dst, const uint8_t *src, int width,
309 for (i = 0; i < width; i++)
313 static void rgbaToA_c(uint8_t *dst, const uint8_t *src, int width,
317 for (i = 0; i < width; i++)
318 dst[i] = src[4 * i + 3];
321 static void palToY_c(uint8_t *dst, const uint8_t *src, int width, uint32_t *pal)
324 for (i = 0; i < width; i++) {
327 dst[i] = pal[d] & 0xFF;
331 static void palToUV_c(uint8_t *dstU, uint8_t *dstV,
332 const uint8_t *src1, const uint8_t *src2,
333 int width, uint32_t *pal)
336 assert(src1 == src2);
337 for (i = 0; i < width; i++) {
338 int p = pal[src1[i]];
345 static void monowhite2Y_c(uint8_t *dst, const uint8_t *src,
346 int width, uint32_t *unused)
349 width = (width + 7) >> 3;
350 for (i = 0; i < width; i++) {
352 for (j = 0; j < 8; j++)
353 dst[8 * i + j] = ((d >> (7 - j)) & 1) * 255;
357 static void monoblack2Y_c(uint8_t *dst, const uint8_t *src,
358 int width, uint32_t *unused)
361 width = (width + 7) >> 3;
362 for (i = 0; i < width; i++) {
364 for (j = 0; j < 8; j++)
365 dst[8 * i + j] = ((d >> (7 - j)) & 1) * 255;
369 static void yuy2ToY_c(uint8_t *dst, const uint8_t *src, int width,
373 for (i = 0; i < width; i++)
377 static void yuy2ToUV_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
378 const uint8_t *src2, int width, uint32_t *unused)
381 for (i = 0; i < width; i++) {
382 dstU[i] = src1[4 * i + 1];
383 dstV[i] = src1[4 * i + 3];
385 assert(src1 == src2);
388 static void bswap16Y_c(uint8_t *_dst, const uint8_t *_src, int width,
392 const uint16_t *src = (const uint16_t *)_src;
393 uint16_t *dst = (uint16_t *)_dst;
394 for (i = 0; i < width; i++)
395 dst[i] = av_bswap16(src[i]);
398 static void bswap16UV_c(uint8_t *_dstU, uint8_t *_dstV, const uint8_t *_src1,
399 const uint8_t *_src2, int width, uint32_t *unused)
402 const uint16_t *src1 = (const uint16_t *)_src1,
403 *src2 = (const uint16_t *)_src2;
404 uint16_t *dstU = (uint16_t *)_dstU, *dstV = (uint16_t *)_dstV;
405 for (i = 0; i < width; i++) {
406 dstU[i] = av_bswap16(src1[i]);
407 dstV[i] = av_bswap16(src2[i]);
411 /* This is almost identical to the previous, end exists only because
412 * yuy2ToY/UV)(dst, src + 1, ...) would have 100% unaligned accesses. */
413 static void uyvyToY_c(uint8_t *dst, const uint8_t *src, int width,
417 for (i = 0; i < width; i++)
418 dst[i] = src[2 * i + 1];
421 static void uyvyToUV_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
422 const uint8_t *src2, int width, uint32_t *unused)
425 for (i = 0; i < width; i++) {
426 dstU[i] = src1[4 * i + 0];
427 dstV[i] = src1[4 * i + 2];
429 assert(src1 == src2);
432 static av_always_inline void nvXXtoUV_c(uint8_t *dst1, uint8_t *dst2,
433 const uint8_t *src, int width)
436 for (i = 0; i < width; i++) {
437 dst1[i] = src[2 * i + 0];
438 dst2[i] = src[2 * i + 1];
442 static void nv12ToUV_c(uint8_t *dstU, uint8_t *dstV,
443 const uint8_t *src1, const uint8_t *src2,
444 int width, uint32_t *unused)
446 nvXXtoUV_c(dstU, dstV, src1, width);
449 static void nv21ToUV_c(uint8_t *dstU, uint8_t *dstV,
450 const uint8_t *src1, const uint8_t *src2,
451 int width, uint32_t *unused)
453 nvXXtoUV_c(dstV, dstU, src1, width);
456 #define input_pixel(pos) (isBE(origin) ? AV_RB16(pos) : AV_RL16(pos))
458 static void bgr24ToY_c(uint8_t *dst, const uint8_t *src,
459 int width, uint32_t *unused)
462 for (i = 0; i < width; i++) {
463 int b = src[i * 3 + 0];
464 int g = src[i * 3 + 1];
465 int r = src[i * 3 + 2];
467 dst[i] = ((RY * r + GY * g + BY * b + (33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
471 static void bgr24ToUV_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
472 const uint8_t *src2, int width, uint32_t *unused)
475 for (i = 0; i < width; i++) {
476 int b = src1[3 * i + 0];
477 int g = src1[3 * i + 1];
478 int r = src1[3 * i + 2];
480 dstU[i] = (RU * r + GU * g + BU * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
481 dstV[i] = (RV * r + GV * g + BV * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
483 assert(src1 == src2);
486 static void bgr24ToUV_half_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
487 const uint8_t *src2, int width, uint32_t *unused)
490 for (i = 0; i < width; i++) {
491 int b = src1[6 * i + 0] + src1[6 * i + 3];
492 int g = src1[6 * i + 1] + src1[6 * i + 4];
493 int r = src1[6 * i + 2] + src1[6 * i + 5];
495 dstU[i] = (RU * r + GU * g + BU * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
496 dstV[i] = (RV * r + GV * g + BV * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
498 assert(src1 == src2);
501 static void rgb24ToY_c(uint8_t *dst, const uint8_t *src, int width,
505 for (i = 0; i < width; i++) {
506 int r = src[i * 3 + 0];
507 int g = src[i * 3 + 1];
508 int b = src[i * 3 + 2];
510 dst[i] = ((RY * r + GY * g + BY * b + (33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
514 static void rgb24ToUV_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
515 const uint8_t *src2, int width, uint32_t *unused)
518 assert(src1 == src2);
519 for (i = 0; i < width; i++) {
520 int r = src1[3 * i + 0];
521 int g = src1[3 * i + 1];
522 int b = src1[3 * i + 2];
524 dstU[i] = (RU * r + GU * g + BU * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
525 dstV[i] = (RV * r + GV * g + BV * b + (257 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT;
529 static void rgb24ToUV_half_c(uint8_t *dstU, uint8_t *dstV, const uint8_t *src1,
530 const uint8_t *src2, int width, uint32_t *unused)
533 assert(src1 == src2);
534 for (i = 0; i < width; i++) {
535 int r = src1[6 * i + 0] + src1[6 * i + 3];
536 int g = src1[6 * i + 1] + src1[6 * i + 4];
537 int b = src1[6 * i + 2] + src1[6 * i + 5];
539 dstU[i] = (RU * r + GU * g + BU * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
540 dstV[i] = (RV * r + GV * g + BV * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
544 static void planar_rgb_to_y(uint8_t *dst, const uint8_t *src[4], int width)
547 for (i = 0; i < width; i++) {
552 dst[i] = ((RY * r + GY * g + BY * b + (33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
556 static void planar_rgb16le_to_y(uint8_t *_dst, const uint8_t *_src[4], int width)
559 const uint16_t **src = (const uint16_t **)_src;
560 uint16_t *dst = (uint16_t *)_dst;
561 for (i = 0; i < width; i++) {
562 int g = AV_RL16(src[0] + i);
563 int b = AV_RL16(src[1] + i);
564 int r = AV_RL16(src[2] + i);
566 dst[i] = ((RY * r + GY * g + BY * b + (33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
570 static void planar_rgb16be_to_y(uint8_t *_dst, const uint8_t *_src[4], int width)
573 const uint16_t **src = (const uint16_t **)_src;
574 uint16_t *dst = (uint16_t *)_dst;
575 for (i = 0; i < width; i++) {
576 int g = AV_RB16(src[0] + i);
577 int b = AV_RB16(src[1] + i);
578 int r = AV_RB16(src[2] + i);
580 dst[i] = ((RY * r + GY * g + BY * b + (33 << (RGB2YUV_SHIFT - 1))) >> RGB2YUV_SHIFT);
584 static void planar_rgb_to_uv(uint8_t *dstU, uint8_t *dstV, const uint8_t *src[4], int width)
587 for (i = 0; i < width; i++) {
592 dstU[i] = (RU * r + GU * g + BU * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
593 dstV[i] = (RV * r + GV * g + BV * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
597 static void planar_rgb16le_to_uv(uint8_t *_dstU, uint8_t *_dstV,
598 const uint8_t *_src[4], int width)
601 const uint16_t **src = (const uint16_t **)_src;
602 uint16_t *dstU = (uint16_t *)_dstU;
603 uint16_t *dstV = (uint16_t *)_dstV;
604 for (i = 0; i < width; i++) {
605 int g = AV_RL16(src[0] + i);
606 int b = AV_RL16(src[1] + i);
607 int r = AV_RL16(src[2] + i);
609 dstU[i] = (RU * r + GU * g + BU * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
610 dstV[i] = (RV * r + GV * g + BV * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
614 static void planar_rgb16be_to_uv(uint8_t *_dstU, uint8_t *_dstV,
615 const uint8_t *_src[4], int width)
618 const uint16_t **src = (const uint16_t **)_src;
619 uint16_t *dstU = (uint16_t *)_dstU;
620 uint16_t *dstV = (uint16_t *)_dstV;
621 for (i = 0; i < width; i++) {
622 int g = AV_RB16(src[0] + i);
623 int b = AV_RB16(src[1] + i);
624 int r = AV_RB16(src[2] + i);
626 dstU[i] = (RU * r + GU * g + BU * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
627 dstV[i] = (RV * r + GV * g + BV * b + (257 << RGB2YUV_SHIFT)) >> (RGB2YUV_SHIFT + 1);
631 av_cold void ff_sws_init_input_funcs(SwsContext *c)
633 enum PixelFormat srcFormat = c->srcFormat;
637 case PIX_FMT_YUYV422:
638 c->chrToYV12 = yuy2ToUV_c;
640 case PIX_FMT_UYVY422:
641 c->chrToYV12 = uyvyToUV_c;
644 c->chrToYV12 = nv12ToUV_c;
647 c->chrToYV12 = nv21ToUV_c;
652 case PIX_FMT_BGR4_BYTE:
653 case PIX_FMT_RGB4_BYTE:
654 c->chrToYV12 = palToUV_c;
656 case PIX_FMT_GBRP9LE:
657 case PIX_FMT_GBRP10LE:
658 case PIX_FMT_GBRP16LE:
659 c->readChrPlanar = planar_rgb16le_to_uv;
661 case PIX_FMT_GBRP9BE:
662 case PIX_FMT_GBRP10BE:
663 case PIX_FMT_GBRP16BE:
664 c->readChrPlanar = planar_rgb16be_to_uv;
667 c->readChrPlanar = planar_rgb_to_uv;
670 case PIX_FMT_YUV444P9LE:
671 case PIX_FMT_YUV422P9LE:
672 case PIX_FMT_YUV420P9LE:
673 case PIX_FMT_YUV422P10LE:
674 case PIX_FMT_YUV444P10LE:
675 case PIX_FMT_YUV420P10LE:
676 case PIX_FMT_YUV420P16LE:
677 case PIX_FMT_YUV422P16LE:
678 case PIX_FMT_YUV444P16LE:
679 c->chrToYV12 = bswap16UV_c;
682 case PIX_FMT_YUV444P9BE:
683 case PIX_FMT_YUV422P9BE:
684 case PIX_FMT_YUV420P9BE:
685 case PIX_FMT_YUV444P10BE:
686 case PIX_FMT_YUV422P10BE:
687 case PIX_FMT_YUV420P10BE:
688 case PIX_FMT_YUV420P16BE:
689 case PIX_FMT_YUV422P16BE:
690 case PIX_FMT_YUV444P16BE:
691 c->chrToYV12 = bswap16UV_c;
695 if (c->chrSrcHSubSample) {
697 case PIX_FMT_RGB48BE:
698 c->chrToYV12 = rgb48BEToUV_half_c;
700 case PIX_FMT_RGB48LE:
701 c->chrToYV12 = rgb48LEToUV_half_c;
703 case PIX_FMT_BGR48BE:
704 c->chrToYV12 = bgr48BEToUV_half_c;
706 case PIX_FMT_BGR48LE:
707 c->chrToYV12 = bgr48LEToUV_half_c;
710 c->chrToYV12 = bgr32ToUV_half_c;
712 case PIX_FMT_RGB32_1:
713 c->chrToYV12 = bgr321ToUV_half_c;
716 c->chrToYV12 = bgr24ToUV_half_c;
718 case PIX_FMT_BGR565LE:
719 c->chrToYV12 = bgr16leToUV_half_c;
721 case PIX_FMT_BGR565BE:
722 c->chrToYV12 = bgr16beToUV_half_c;
724 case PIX_FMT_BGR555LE:
725 c->chrToYV12 = bgr15leToUV_half_c;
727 case PIX_FMT_BGR555BE:
728 c->chrToYV12 = bgr15beToUV_half_c;
730 case PIX_FMT_BGR444LE:
731 c->chrToYV12 = bgr12leToUV_half_c;
733 case PIX_FMT_BGR444BE:
734 c->chrToYV12 = bgr12beToUV_half_c;
737 c->chrToYV12 = rgb32ToUV_half_c;
739 case PIX_FMT_BGR32_1:
740 c->chrToYV12 = rgb321ToUV_half_c;
743 c->chrToYV12 = rgb24ToUV_half_c;
745 case PIX_FMT_RGB565LE:
746 c->chrToYV12 = rgb16leToUV_half_c;
748 case PIX_FMT_RGB565BE:
749 c->chrToYV12 = rgb16beToUV_half_c;
751 case PIX_FMT_RGB555LE:
752 c->chrToYV12 = rgb15leToUV_half_c;
754 case PIX_FMT_RGB555BE:
755 c->chrToYV12 = rgb15beToUV_half_c;
757 case PIX_FMT_RGB444LE:
758 c->chrToYV12 = rgb12leToUV_half_c;
760 case PIX_FMT_RGB444BE:
761 c->chrToYV12 = rgb12beToUV_half_c;
766 case PIX_FMT_RGB48BE:
767 c->chrToYV12 = rgb48BEToUV_c;
769 case PIX_FMT_RGB48LE:
770 c->chrToYV12 = rgb48LEToUV_c;
772 case PIX_FMT_BGR48BE:
773 c->chrToYV12 = bgr48BEToUV_c;
775 case PIX_FMT_BGR48LE:
776 c->chrToYV12 = bgr48LEToUV_c;
779 c->chrToYV12 = bgr32ToUV_c;
781 case PIX_FMT_RGB32_1:
782 c->chrToYV12 = bgr321ToUV_c;
785 c->chrToYV12 = bgr24ToUV_c;
787 case PIX_FMT_BGR565LE:
788 c->chrToYV12 = bgr16leToUV_c;
790 case PIX_FMT_BGR565BE:
791 c->chrToYV12 = bgr16beToUV_c;
793 case PIX_FMT_BGR555LE:
794 c->chrToYV12 = bgr15leToUV_c;
796 case PIX_FMT_BGR555BE:
797 c->chrToYV12 = bgr15beToUV_c;
799 case PIX_FMT_BGR444LE:
800 c->chrToYV12 = bgr12leToUV_c;
802 case PIX_FMT_BGR444BE:
803 c->chrToYV12 = bgr12beToUV_c;
806 c->chrToYV12 = rgb32ToUV_c;
808 case PIX_FMT_BGR32_1:
809 c->chrToYV12 = rgb321ToUV_c;
812 c->chrToYV12 = rgb24ToUV_c;
814 case PIX_FMT_RGB565LE:
815 c->chrToYV12 = rgb16leToUV_c;
817 case PIX_FMT_RGB565BE:
818 c->chrToYV12 = rgb16beToUV_c;
820 case PIX_FMT_RGB555LE:
821 c->chrToYV12 = rgb15leToUV_c;
823 case PIX_FMT_RGB555BE:
824 c->chrToYV12 = rgb15beToUV_c;
826 case PIX_FMT_RGB444LE:
827 c->chrToYV12 = rgb12leToUV_c;
829 case PIX_FMT_RGB444BE:
830 c->chrToYV12 = rgb12beToUV_c;
838 case PIX_FMT_GBRP9LE:
839 case PIX_FMT_GBRP10LE:
840 case PIX_FMT_GBRP16LE:
841 c->readLumPlanar = planar_rgb16le_to_y;
843 case PIX_FMT_GBRP9BE:
844 case PIX_FMT_GBRP10BE:
845 case PIX_FMT_GBRP16BE:
846 c->readLumPlanar = planar_rgb16be_to_y;
849 c->readLumPlanar = planar_rgb_to_y;
852 case PIX_FMT_YUV444P9LE:
853 case PIX_FMT_YUV422P9LE:
854 case PIX_FMT_YUV420P9LE:
855 case PIX_FMT_YUV444P10LE:
856 case PIX_FMT_YUV422P10LE:
857 case PIX_FMT_YUV420P10LE:
858 case PIX_FMT_YUV420P16LE:
859 case PIX_FMT_YUV422P16LE:
860 case PIX_FMT_YUV444P16LE:
861 case PIX_FMT_GRAY16LE:
862 c->lumToYV12 = bswap16Y_c;
865 case PIX_FMT_YUV444P9BE:
866 case PIX_FMT_YUV422P9BE:
867 case PIX_FMT_YUV420P9BE:
868 case PIX_FMT_YUV444P10BE:
869 case PIX_FMT_YUV422P10BE:
870 case PIX_FMT_YUV420P10BE:
871 case PIX_FMT_YUV420P16BE:
872 case PIX_FMT_YUV422P16BE:
873 case PIX_FMT_YUV444P16BE:
874 case PIX_FMT_GRAY16BE:
875 c->lumToYV12 = bswap16Y_c;
878 case PIX_FMT_YUYV422:
880 c->lumToYV12 = yuy2ToY_c;
882 case PIX_FMT_UYVY422:
883 c->lumToYV12 = uyvyToY_c;
886 c->lumToYV12 = bgr24ToY_c;
888 case PIX_FMT_BGR565LE:
889 c->lumToYV12 = bgr16leToY_c;
891 case PIX_FMT_BGR565BE:
892 c->lumToYV12 = bgr16beToY_c;
894 case PIX_FMT_BGR555LE:
895 c->lumToYV12 = bgr15leToY_c;
897 case PIX_FMT_BGR555BE:
898 c->lumToYV12 = bgr15beToY_c;
900 case PIX_FMT_BGR444LE:
901 c->lumToYV12 = bgr12leToY_c;
903 case PIX_FMT_BGR444BE:
904 c->lumToYV12 = bgr12beToY_c;
907 c->lumToYV12 = rgb24ToY_c;
909 case PIX_FMT_RGB565LE:
910 c->lumToYV12 = rgb16leToY_c;
912 case PIX_FMT_RGB565BE:
913 c->lumToYV12 = rgb16beToY_c;
915 case PIX_FMT_RGB555LE:
916 c->lumToYV12 = rgb15leToY_c;
918 case PIX_FMT_RGB555BE:
919 c->lumToYV12 = rgb15beToY_c;
921 case PIX_FMT_RGB444LE:
922 c->lumToYV12 = rgb12leToY_c;
924 case PIX_FMT_RGB444BE:
925 c->lumToYV12 = rgb12beToY_c;
930 case PIX_FMT_BGR4_BYTE:
931 case PIX_FMT_RGB4_BYTE:
932 c->lumToYV12 = palToY_c;
934 case PIX_FMT_MONOBLACK:
935 c->lumToYV12 = monoblack2Y_c;
937 case PIX_FMT_MONOWHITE:
938 c->lumToYV12 = monowhite2Y_c;
941 c->lumToYV12 = bgr32ToY_c;
943 case PIX_FMT_RGB32_1:
944 c->lumToYV12 = bgr321ToY_c;
947 c->lumToYV12 = rgb32ToY_c;
949 case PIX_FMT_BGR32_1:
950 c->lumToYV12 = rgb321ToY_c;
952 case PIX_FMT_RGB48BE:
953 c->lumToYV12 = rgb48BEToY_c;
955 case PIX_FMT_RGB48LE:
956 c->lumToYV12 = rgb48LEToY_c;
958 case PIX_FMT_BGR48BE:
959 c->lumToYV12 = bgr48BEToY_c;
961 case PIX_FMT_BGR48LE:
962 c->lumToYV12 = bgr48LEToY_c;
969 c->alpToYV12 = rgbaToA_c;
973 c->alpToYV12 = abgrToA_c;
976 c->alpToYV12 = uyvyToY_c;