]> git.sesse.net Git - ffmpeg/blobdiff - libswscale/swscale.c
Fix a possible crash on 64 bit systems when the lumSrcPtr or chrSrcPtr
[ffmpeg] / libswscale / swscale.c
index 1b649f33d42bc975a3b9f59cb4ac69be971f4514..0c1f8f3f4578972a11c1e79de8959884a01e6150 100644 (file)
@@ -1,26 +1,28 @@
 /*
-    Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
-
-    This program is free software; you can redistribute it and/or modify
-    it under the terms of the GNU General Public License as published by
-    the Free Software Foundation; either version 2 of the License, or
-    (at your option) any later version.
-
-    This program is distributed in the hope that it will be useful,
-    but WITHOUT ANY WARRANTY; without even the implied warranty of
-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-    GNU General Public License for more details.
-
-    You should have received a copy of the GNU General Public License
-    along with this program; if not, write to the Free Software
-    Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
-
-    the C code (not assembly, mmx, ...) of the swscaler which has been written
-    by Michael Niedermayer can be used under the LGPL license too
-*/
+ * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+ *
+ * the C code (not assembly, mmx, ...) of this file can be used
+ * under the LGPL license too
+ */
 
 /*
-  supported Input formats: YV12, I420/IYUV, YUY2, UYVY, BGR32, BGR24, BGR16, BGR15, RGB32, RGB24, Y8/Y800, YVU9/IF09
+  supported Input formats: YV12, I420/IYUV, YUY2, UYVY, BGR32, BGR24, BGR16, BGR15, RGB32, RGB24, Y8/Y800, YVU9/IF09, PAL8
   supported output formats: YV12, I420/IYUV, YUY2, UYVY, {BGR,RGB}{1,4,8,15,16,24,32}, Y8/Y800, YVU9/IF09
   {BGR,RGB}{1,4,8,15,16} support dithering
   
@@ -59,11 +61,6 @@ untested special converters
 #include <unistd.h>
 #include "config.h"
 #include <assert.h>
-#ifdef HAVE_MALLOC_H
-#include <malloc.h>
-#else
-#include <stdlib.h>
-#endif
 #ifdef HAVE_SYS_MMAN_H
 #include <sys/mman.h>
 #if defined(MAP_ANON) && !defined(MAP_ANONYMOUS)
@@ -107,13 +104,17 @@ untested special converters
 
 #define isSupportedIn(x)  ((x)==PIX_FMT_YUV420P || (x)==PIX_FMT_YUYV422 || (x)==PIX_FMT_UYVY422\
                        || (x)==PIX_FMT_RGB32|| (x)==PIX_FMT_BGR24|| (x)==PIX_FMT_BGR565|| (x)==PIX_FMT_BGR555\
-                       || (x)==PIX_FMT_BGR32|| (x)==PIX_FMT_RGB24\
+                       || (x)==PIX_FMT_BGR32|| (x)==PIX_FMT_RGB24|| (x)==PIX_FMT_RGB565|| (x)==PIX_FMT_RGB555\
                        || (x)==PIX_FMT_GRAY8 || (x)==PIX_FMT_YUV410P\
-                       || (x)==PIX_FMT_YUV444P || (x)==PIX_FMT_YUV422P || (x)==PIX_FMT_YUV411P)
+                       || (x)==PIX_FMT_GRAY16BE || (x)==PIX_FMT_GRAY16LE\
+                       || (x)==PIX_FMT_YUV444P || (x)==PIX_FMT_YUV422P || (x)==PIX_FMT_YUV411P\
+                       || (x)==PIX_FMT_PAL8 || (x)==PIX_FMT_BGR8 || (x)==PIX_FMT_RGB8\
+                        || (x)==PIX_FMT_BGR4_BYTE  || (x)==PIX_FMT_RGB4_BYTE)
 #define isSupportedOut(x) ((x)==PIX_FMT_YUV420P || (x)==PIX_FMT_YUYV422 || (x)==PIX_FMT_UYVY422\
                        || (x)==PIX_FMT_YUV444P || (x)==PIX_FMT_YUV422P || (x)==PIX_FMT_YUV411P\
                        || isRGB(x) || isBGR(x)\
                        || (x)==PIX_FMT_NV12 || (x)==PIX_FMT_NV21\
+                       || (x)==PIX_FMT_GRAY16BE || (x)==PIX_FMT_GRAY16LE\
                        || (x)==PIX_FMT_GRAY8 || (x)==PIX_FMT_YUV410P)
 #define isPacked(x)    ((x)==PIX_FMT_YUYV422 || (x)==PIX_FMT_UYVY422 ||isRGB(x) || isBGR(x))
 
@@ -145,7 +146,7 @@ add BGR4 output support
 write special BGR->BGR scaler
 */
 
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86) && defined (CONFIG_GPL)
 static uint64_t attribute_used __attribute__((aligned(8))) bF8=       0xF8F8F8F8F8F8F8F8LL;
 static uint64_t attribute_used __attribute__((aligned(8))) bFC=       0xFCFCFCFCFCFCFCFCLL;
 static uint64_t __attribute__((aligned(8))) w10=       0x0010001000100010LL;
@@ -191,7 +192,7 @@ static const uint64_t bgr2VCoeff  attribute_used __attribute__((aligned(8))) = 0
 static const uint64_t bgr2YOffset attribute_used __attribute__((aligned(8))) = 0x1010101010101010ULL;
 static const uint64_t bgr2UVOffset attribute_used __attribute__((aligned(8)))= 0x8080808080808080ULL;
 static const uint64_t w1111       attribute_used __attribute__((aligned(8))) = 0x0001000100010001ULL;
-#endif /* defined(ARCH_X86) || defined(ARCH_X86_64) */
+#endif /* defined(ARCH_X86) */
 
 // clipping helper table for C implementations:
 static unsigned char clip_table[768];
@@ -204,6 +205,12 @@ extern const uint8_t dither_8x8_32[8][8];
 extern const uint8_t dither_8x8_73[8][8];
 extern const uint8_t dither_8x8_220[8][8];
 
+static const char * sws_context_to_name(void * ptr) {
+    return "swscaler";
+}
+
+static AVClass sws_context_class = { "SWScaler", sws_context_to_name, NULL };
+
 char *sws_format_name(enum PixelFormat format)
 {
     switch (format) {
@@ -229,6 +236,10 @@ char *sws_format_name(enum PixelFormat format)
             return "rgb565";
         case PIX_FMT_RGB555:
             return "rgb555";
+        case PIX_FMT_GRAY16BE:
+            return "gray16be";
+        case PIX_FMT_GRAY16LE:
+            return "gray16le";
         case PIX_FMT_GRAY8:
             return "gray8";
         case PIX_FMT_MONOWHITE:
@@ -282,7 +293,7 @@ char *sws_format_name(enum PixelFormat format)
     }
 }
 
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86) && defined (CONFIG_GPL)
 void in_asm_used_var_warning_killer()
 {
  volatile int i= bF8+bFC+w10+
@@ -305,7 +316,7 @@ static inline void yuv2yuvXinC(int16_t *lumFilter, int16_t **lumSrc, int lumFilt
                for(j=0; j<lumFilterSize; j++)
                        val += lumSrc[j][i] * lumFilter[j];
 
-               dest[i]= FFMIN(FFMAX(val>>19, 0), 255);
+               dest[i]= av_clip_uint8(val>>19);
        }
 
        if(uDest != NULL)
@@ -320,8 +331,8 @@ static inline void yuv2yuvXinC(int16_t *lumFilter, int16_t **lumSrc, int lumFilt
                                v += chrSrc[j][i + 2048] * chrFilter[j];
                        }
 
-                       uDest[i]= FFMIN(FFMAX(u>>19, 0), 255);
-                       vDest[i]= FFMIN(FFMAX(v>>19, 0), 255);
+                       uDest[i]= av_clip_uint8(u>>19);
+                       vDest[i]= av_clip_uint8(v>>19);
                }
 }
 
@@ -338,7 +349,7 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                for(j=0; j<lumFilterSize; j++)
                        val += lumSrc[j][i] * lumFilter[j];
 
-               dest[i]= FFMIN(FFMAX(val>>19, 0), 255);
+               dest[i]= av_clip_uint8(val>>19);
        }
 
        if(uDest == NULL)
@@ -356,8 +367,8 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                                v += chrSrc[j][i + 2048] * chrFilter[j];
                        }
 
-                       uDest[2*i]= FFMIN(FFMAX(u>>19, 0), 255);
-                       uDest[2*i+1]= FFMIN(FFMAX(v>>19, 0), 255);
+                       uDest[2*i]= av_clip_uint8(u>>19);
+                       uDest[2*i+1]= av_clip_uint8(v>>19);
                }
        else
                for(i=0; i<chrDstW; i++)
@@ -371,8 +382,8 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                                v += chrSrc[j][i + 2048] * chrFilter[j];
                        }
 
-                       uDest[2*i]= FFMIN(FFMAX(v>>19, 0), 255);
-                       uDest[2*i+1]= FFMIN(FFMAX(u>>19, 0), 255);
+                       uDest[2*i]= av_clip_uint8(v>>19);
+                       uDest[2*i+1]= av_clip_uint8(u>>19);
                }
 }
 
@@ -383,7 +394,7 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                        int Y2=1<<18;\
                        int U=1<<18;\
                        int V=1<<18;\
-                       type *r, *b, *g;\
+                       type attribute_unused *r, *b, *g;\
                        const int i2= 2*i;\
                        \
                        for(j=0; j<lumFilterSize; j++)\
@@ -414,9 +425,9 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                         
 #define YSCALE_YUV_2_RGBX_C(type) \
                        YSCALE_YUV_2_PACKEDX_C(type)\
-                       r = c->table_rV[V];\
-                       g = c->table_gU[U] + c->table_gV[V];\
-                       b = c->table_bU[U];\
+                       r = (type *)c->table_rV[V];\
+                       g = (type *)(c->table_gU[U] + c->table_gV[V]);\
+                       b = (type *)c->table_bU[U];\
 
 #define YSCALE_YUV_2_PACKED2_C \
                for(i=0; i<(dstW>>1); i++){\
@@ -429,9 +440,9 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
 #define YSCALE_YUV_2_RGB2_C(type) \
                        YSCALE_YUV_2_PACKED2_C\
                        type *r, *b, *g;\
-                       r = c->table_rV[V];\
-                       g = c->table_gU[U] + c->table_gV[V];\
-                       b = c->table_bU[U];\
+                       r = (type *)c->table_rV[V];\
+                       g = (type *)(c->table_gU[U] + c->table_gV[V]);\
+                       b = (type *)c->table_bU[U];\
 
 #define YSCALE_YUV_2_PACKED1_C \
                for(i=0; i<(dstW>>1); i++){\
@@ -444,9 +455,9 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
 #define YSCALE_YUV_2_RGB1_C(type) \
                        YSCALE_YUV_2_PACKED1_C\
                        type *r, *b, *g;\
-                       r = c->table_rV[V];\
-                       g = c->table_gU[U] + c->table_gV[V];\
-                       b = c->table_bU[U];\
+                       r = (type *)c->table_rV[V];\
+                       g = (type *)(c->table_gU[U] + c->table_gV[V]);\
+                       b = (type *)c->table_bU[U];\
 
 #define YSCALE_YUV_2_PACKED1B_C \
                for(i=0; i<(dstW>>1); i++){\
@@ -459,9 +470,9 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
 #define YSCALE_YUV_2_RGB1B_C(type) \
                        YSCALE_YUV_2_PACKED1B_C\
                        type *r, *b, *g;\
-                       r = c->table_rV[V];\
-                       g = c->table_gU[U] + c->table_gV[V];\
-                       b = c->table_bU[U];\
+                       r = (type *)c->table_rV[V];\
+                       g = (type *)(c->table_gU[U] + c->table_gV[V]);\
+                       b = (type *)c->table_bU[U];\
 
 #define YSCALE_YUV_2_ANYRGB_C(func, func2)\
        switch(c->dstFormat)\
@@ -601,8 +612,8 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
                                        + (last_new[y][i] - in3)*f/256;\
                                int new= old> 128 ? 255 : 0;\
 \
-                               error_new+= ABS(last_new[y][i] - new);\
-                               error_in3+= ABS(last_in3[y][i] - in3);\
+                               error_new+= FFABS(last_new[y][i] - new);\
+                               error_in3+= FFABS(last_in3[y][i] - in3);\
                                f= error_new - error_in3*4;\
                                if(f<0) f=0;\
                                if(f>256) f=256;\
@@ -795,27 +806,27 @@ static inline void yuv2packedXinC(SwsContext *c, int16_t *lumFilter, int16_t **l
 
 //Note: we have C, X86, MMX, MMX2, 3DNOW version therse no 3DNOW+MMX2 one
 //Plain C versions
-#if !defined (HAVE_MMX) || defined (RUNTIME_CPUDETECT)
+#if !defined (HAVE_MMX) || defined (RUNTIME_CPUDETECT) || !defined(CONFIG_GPL)
 #define COMPILE_C
 #endif
 
 #ifdef ARCH_POWERPC
-#if defined (HAVE_ALTIVEC) || defined (RUNTIME_CPUDETECT)
+#if (defined (HAVE_ALTIVEC) || defined (RUNTIME_CPUDETECT)) && defined (CONFIG_GPL)
 #define COMPILE_ALTIVEC
 #endif //HAVE_ALTIVEC
 #endif //ARCH_POWERPC
 
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86)
 
-#if (defined (HAVE_MMX) && !defined (HAVE_3DNOW) && !defined (HAVE_MMX2)) || defined (RUNTIME_CPUDETECT)
+#if ((defined (HAVE_MMX) && !defined (HAVE_3DNOW) && !defined (HAVE_MMX2)) || defined (RUNTIME_CPUDETECT)) && defined (CONFIG_GPL)
 #define COMPILE_MMX
 #endif
 
-#if defined (HAVE_MMX2) || defined (RUNTIME_CPUDETECT)
+#if (defined (HAVE_MMX2) || defined (RUNTIME_CPUDETECT)) && defined (CONFIG_GPL)
 #define COMPILE_MMX2
 #endif
 
-#if (defined (HAVE_3DNOW) && !defined (HAVE_MMX2)) || defined (RUNTIME_CPUDETECT)
+#if ((defined (HAVE_3DNOW) && !defined (HAVE_MMX2)) || defined (RUNTIME_CPUDETECT)) && defined (CONFIG_GPL)
 #define COMPILE_3DNOW
 #endif
 #endif //ARCH_X86 || ARCH_X86_64
@@ -842,7 +853,7 @@ static inline void yuv2packedXinC(SwsContext *c, int16_t *lumFilter, int16_t **l
 #endif
 #endif //ARCH_POWERPC
 
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86)
 
 //X86 versions
 /*
@@ -909,7 +920,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
        int minFilterSize;
        double *filter=NULL;
        double *filter2=NULL;
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86)
        if(flags & SWS_CPU_CAPS_MMX)
                asm volatile("emms\n\t"::: "memory"); //FIXME this shouldnt be required but it IS (even for non mmx versions)
 #endif
@@ -917,7 +928,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
        // Note the +1 is for the MMXscaler which reads over the end
        *filterPos = av_malloc((dstW+1)*sizeof(int16_t));
 
-       if(ABS(xInc - 0x10000) <10) // unscaled
+       if(FFABS(xInc - 0x10000) <10) // unscaled
        {
                int i;
                filterSize= 1;
@@ -967,7 +978,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
                                //Bilinear upscale / linear interpolate / Area averaging
                                for(j=0; j<filterSize; j++)
                                {
-                                       double d= ABS((xx<<16) - xDstInSrc)/(double)(1<<16);
+                                       double d= FFABS((xx<<16) - xDstInSrc)/(double)(1<<16);
                                        double coeff= 1.0 - d;
                                        if(coeff<0) coeff=0;
                                        filter[i*filterSize + j]= coeff;
@@ -1011,7 +1022,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
                        (*filterPos)[i]= xx;
                        for(j=0; j<filterSize; j++)
                        {
-                               double d= ABS(xx - xDstInSrc)/filterSizeInSrc*sizeFactor;
+                               double d= FFABS(xx - xDstInSrc)/filterSizeInSrc*sizeFactor;
                                double coeff;
                                if(flags & SWS_BICUBIC)
                                {
@@ -1136,7 +1147,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
                for(j=0; j<filter2Size; j++)
                {
                        int k;
-                       cutOff += ABS(filter2[i*filter2Size]);
+                       cutOff += FFABS(filter2[i*filter2Size]);
 
                        if(cutOff > SWS_MAX_REDUCE_CUTOFF) break;
 
@@ -1154,7 +1165,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
                /* count near zeros on the right */
                for(j=filter2Size-1; j>0; j--)
                {
-                       cutOff += ABS(filter2[i*filter2Size + j]);
+                       cutOff += FFABS(filter2[i*filter2Size + j]);
 
                        if(cutOff > SWS_MAX_REDUCE_CUTOFF) break;
                        min--;
@@ -1193,7 +1204,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
        *outFilterSize= filterSize;
 
        if(flags&SWS_PRINT_INFO)
-               MSG_V("SwScaler: reducing / aligning filtersize %d -> %d\n", filter2Size, filterSize);
+               av_log(NULL, AV_LOG_VERBOSE, "SwScaler: reducing / aligning filtersize %d -> %d\n", filter2Size, filterSize);
        /* try to reduce the filter-size (step2 reduce it) */
        for(i=0; i<dstW; i++)
        {
@@ -1242,8 +1253,7 @@ static inline int initFilter(int16_t **outFilter, int16_t **filterPos, int *outF
 
        // Note the +1 is for the MMXscaler which reads over the end
        /* align at 16 for AltiVec (needed by hScale_altivec_real) */
-       *outFilter= av_malloc(*outFilterSize*(dstW+1)*sizeof(int16_t));
-       memset(*outFilter, 0, *outFilterSize*(dstW+1)*sizeof(int16_t));
+       *outFilter= av_mallocz(*outFilterSize*(dstW+1)*sizeof(int16_t));
 
        /* Normalize & Store in outFilter */
        for(i=0; i<dstW; i++)
@@ -1455,15 +1465,15 @@ static void globalInit(void){
     // generating tables:
     int i;
     for(i=0; i<768; i++){
-       int c= FFMIN(FFMAX(i-256, 0), 255);
+       int c= av_clip_uint8(i-256);
        clip_table[i]=c;
     }
 }
 
 static SwsFunc getSwsFunc(int flags){
     
-#ifdef RUNTIME_CPUDETECT
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(RUNTIME_CPUDETECT) && defined (CONFIG_GPL)
+#if defined(ARCH_X86)
        // ordered per speed fasterst first
        if(flags & SWS_CPU_CAPS_MMX2)
                return swScale_MMX2;
@@ -1482,7 +1492,7 @@ static SwsFunc getSwsFunc(int flags){
          return swScale_C;
 #endif
        return swScale_C;
-#endif /* defined(ARCH_X86) || defined(ARCH_X86_64) */
+#endif /* defined(ARCH_X86) */
 #else //RUNTIME_CPUDETECT
 #ifdef HAVE_MMX2
        return swScale_MMX2;
@@ -1570,7 +1580,7 @@ static int rgb2rgbWrapper(SwsContext *c, uint8_t* src[], int srcStride[], int sr
                case 0x83: conv= rgb15to32; break;
                case 0x84: conv= rgb16to32; break;
                case 0x86: conv= rgb24to32; break;
-               default: MSG_ERR("swScaler: internal error %s -> %s converter\n", 
+               default: av_log(c, AV_LOG_ERROR, "swScaler: internal error %s -> %s converter\n", 
                                 sws_format_name(srcFormat), sws_format_name(dstFormat)); break;
                }
        }else if(   (isBGR(srcFormat) && isRGB(dstFormat))
@@ -1592,11 +1602,11 @@ static int rgb2rgbWrapper(SwsContext *c, uint8_t* src[], int srcStride[], int sr
                case 0x84: conv= rgb16tobgr32; break;
                case 0x86: conv= rgb24tobgr32; break;
                case 0x88: conv= rgb32tobgr32; break;
-               default: MSG_ERR("swScaler: internal error %s -> %s converter\n", 
+               default: av_log(c, AV_LOG_ERROR, "swScaler: internal error %s -> %s converter\n", 
                                 sws_format_name(srcFormat), sws_format_name(dstFormat)); break;
                }
        }else{
-               MSG_ERR("swScaler: internal error %s -> %s converter\n", 
+               av_log(c, AV_LOG_ERROR, "swScaler: internal error %s -> %s converter\n", 
                         sws_format_name(srcFormat), sws_format_name(dstFormat));
        }
 
@@ -1676,8 +1686,8 @@ static int simpleCopy(SwsContext *c, uint8_t* src[], int srcStride[], int srcSli
                        int length=0;
 
                        /* universal length finder */
-                       while(length+c->srcW <= ABS(dstStride[0]) 
-                          && length+c->srcW <= ABS(srcStride[0])) length+= c->srcW;
+                       while(length+c->srcW <= FFABS(dstStride[0]) 
+                          && length+c->srcW <= FFABS(srcStride[0])) length+= c->srcW;
                        ASSERT(length!=0);
 
                        for(i=0; i<srcSliceH; i++)
@@ -1724,6 +1734,72 @@ static int simpleCopy(SwsContext *c, uint8_t* src[], int srcStride[], int srcSli
        return srcSliceH;
 }
 
+static int gray16togray(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
+             int srcSliceH, uint8_t* dst[], int dstStride[]){
+
+       int length= c->srcW;
+       int y=      srcSliceY;
+       int height= srcSliceH;
+       int i, j;
+       uint8_t *srcPtr= src[0];
+       uint8_t *dstPtr= dst[0] + dstStride[0]*y;
+
+       if(!isGray(c->dstFormat)){
+               int height= -((-srcSliceH)>>c->chrDstVSubSample);
+               memset(dst[1], 128, dstStride[1]*height);
+               memset(dst[2], 128, dstStride[2]*height);
+       }
+       if(c->srcFormat == PIX_FMT_GRAY16LE) srcPtr++;
+       for(i=0; i<height; i++)
+       {
+               for(j=0; j<length; j++) dstPtr[j] = srcPtr[j<<1];
+               srcPtr+= srcStride[0];
+               dstPtr+= dstStride[0];
+       }
+       return srcSliceH;
+}
+
+static int graytogray16(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
+             int srcSliceH, uint8_t* dst[], int dstStride[]){
+
+       int length= c->srcW;
+       int y=      srcSliceY;
+       int height= srcSliceH;
+       int i, j;
+       uint8_t *srcPtr= src[0];
+       uint8_t *dstPtr= dst[0] + dstStride[0]*y;
+       for(i=0; i<height; i++)
+       {
+               for(j=0; j<length; j++)
+               {
+                       dstPtr[j<<1] = srcPtr[j];
+                       dstPtr[(j<<1)+1] = srcPtr[j];
+               }
+               srcPtr+= srcStride[0];
+               dstPtr+= dstStride[0];
+       }
+       return srcSliceH;
+}
+
+static int gray16swap(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
+             int srcSliceH, uint8_t* dst[], int dstStride[]){
+
+       int length= c->srcW;
+       int y=      srcSliceY;
+       int height= srcSliceH;
+       int i, j;
+       uint16_t *srcPtr= src[0];
+       uint16_t *dstPtr= dst[0] + dstStride[0]*y/2;
+       for(i=0; i<height; i++)
+       {
+               for(j=0; j<length; j++) dstPtr[j] = bswap_16(srcPtr[j]);
+               srcPtr+= srcStride[0]/2;
+               dstPtr+= dstStride[0]/2;
+       }
+       return srcSliceH;
+}
+
+
 static void getSubSampleFactors(int *h, int *v, int format){
        switch(format){
        case PIX_FMT_UYVY422:
@@ -1732,6 +1808,8 @@ static void getSubSampleFactors(int *h, int *v, int format){
                *v=0;
                break;
        case PIX_FMT_YUV420P:
+       case PIX_FMT_GRAY16BE:
+       case PIX_FMT_GRAY16LE:
        case PIX_FMT_GRAY8: //FIXME remove after different subsamplings are fully implemented
        case PIX_FMT_NV12:
        case PIX_FMT_NV21:
@@ -1867,12 +1945,12 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
        int unscaled, needsDither;
        int srcRange, dstRange;
        SwsFilter dummyFilter= {NULL, NULL, NULL, NULL};
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86)
        if(flags & SWS_CPU_CAPS_MMX)
                asm volatile("emms\n\t"::: "memory");
 #endif
 
-#ifndef RUNTIME_CPUDETECT //ensure that the flags match the compiled variant if cpudetect is off
+#if !defined(RUNTIME_CPUDETECT) || !defined (CONFIG_GPL) //ensure that the flags match the compiled variant if cpudetect is off
        flags &= ~(SWS_CPU_CAPS_MMX|SWS_CPU_CAPS_MMX2|SWS_CPU_CAPS_3DNOW|SWS_CPU_CAPS_ALTIVEC);
 #ifdef HAVE_MMX2
        flags |= SWS_CPU_CAPS_MMX|SWS_CPU_CAPS_MMX2;
@@ -1897,19 +1975,19 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
 
        if(!isSupportedIn(srcFormat)) 
        {
-               MSG_ERR("swScaler: %s is not supported as input format\n", sws_format_name(srcFormat));
+               av_log(NULL, AV_LOG_ERROR, "swScaler: %s is not supported as input format\n", sws_format_name(srcFormat));
                return NULL;
        }
        if(!isSupportedOut(dstFormat))
        {
-               MSG_ERR("swScaler: %s is not supported as output format\n", sws_format_name(dstFormat));
+               av_log(NULL, AV_LOG_ERROR, "swScaler: %s is not supported as output format\n", sws_format_name(dstFormat));
                return NULL;
        }
 
        /* sanity check */
        if(srcW<4 || srcH<1 || dstW<8 || dstH<1) //FIXME check if these are enough and try to lowwer them after fixing the relevant parts of the code
        {
-                MSG_ERR("swScaler: %dx%d -> %dx%d is invalid scaling dimension\n", 
+                av_log(NULL, AV_LOG_ERROR, "swScaler: %dx%d -> %dx%d is invalid scaling dimension\n", 
                        srcW, srcH, dstW, dstH);
                return NULL;
        }
@@ -1917,9 +1995,9 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
        if(!dstFilter) dstFilter= &dummyFilter;
        if(!srcFilter) srcFilter= &dummyFilter;
 
-       c= av_malloc(sizeof(SwsContext));
-       memset(c, 0, sizeof(SwsContext));
+       c= av_mallocz(sizeof(SwsContext));
 
+       c->av_class = &sws_context_class;
        c->srcW= srcW;
        c->srcH= srcH;
        c->dstW= dstW;
@@ -1982,11 +2060,13 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
                {
                        c->swScale= PlanarToNV12Wrapper;
                }
+#ifdef CONFIG_GPL
                /* yuv2bgr */
                if((srcFormat==PIX_FMT_YUV420P || srcFormat==PIX_FMT_YUV422P) && (isBGR(dstFormat) || isRGB(dstFormat)))
                {
                        c->swScale= yuv2rgb_get_func_ptr(c);
                }
+#endif
                
                if( srcFormat==PIX_FMT_YUV410P && dstFormat==PIX_FMT_YUV420P )
                {
@@ -2043,9 +2123,23 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
                        c->swScale= simpleCopy;
                }
 
+               /* gray16{le,be} conversions */
+               if(isGray16(srcFormat) && (isPlanarYUV(dstFormat) || (dstFormat == PIX_FMT_GRAY8)))
+               {
+                       c->swScale= gray16togray;
+               }
+               if((isPlanarYUV(srcFormat) || (srcFormat == PIX_FMT_GRAY8)) && isGray16(dstFormat))
+               {
+                       c->swScale= graytogray16;
+               }
+               if(srcFormat != dstFormat && isGray16(srcFormat) && isGray16(dstFormat))
+               {
+                       c->swScale= gray16swap;
+               }               
+
                if(c->swScale){
                        if(flags&SWS_PRINT_INFO)
-                               MSG_INFO("SwScaler: using unscaled %s -> %s special converter\n", 
+                               av_log(c, AV_LOG_INFO, "SwScaler: using unscaled %s -> %s special converter\n", 
                                        sws_format_name(srcFormat), sws_format_name(dstFormat));
                        return c;
                }
@@ -2057,7 +2151,7 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
                if(!c->canMMX2BeUsed && dstW >=srcW && (srcW&15)==0 && (flags&SWS_FAST_BILINEAR))
                {
                        if(flags&SWS_PRINT_INFO)
-                               MSG_INFO("SwScaler: output Width is not a multiple of 32 -> no MMX2 scaler\n");
+                               av_log(c, AV_LOG_INFO, "SwScaler: output Width is not a multiple of 32 -> no MMX2 scaler\n");
                }
                if(usesHFilter) c->canMMX2BeUsed=0;
        }
@@ -2189,12 +2283,11 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
        //Note we need at least one pixel more at the end because of the mmx code (just in case someone wanna replace the 4000/8000)
        /* align at 16 bytes for AltiVec */
        for(i=0; i<c->vLumBufSize; i++)
-               c->lumPixBuf[i]= c->lumPixBuf[i+c->vLumBufSize]= av_malloc(4000);
+               c->lumPixBuf[i]= c->lumPixBuf[i+c->vLumBufSize]= av_mallocz(4000);
        for(i=0; i<c->vChrBufSize; i++)
                c->chrPixBuf[i]= c->chrPixBuf[i+c->vChrBufSize]= av_malloc(8000);
 
        //try to avoid drawing green stuff between the right end and the stride end
-       for(i=0; i<c->vLumBufSize; i++) memset(c->lumPixBuf[i], 0, 4000);
        for(i=0; i<c->vChrBufSize; i++) memset(c->chrPixBuf[i], 64, 8000);
 
        ASSERT(c->chrDstH <= dstH)
@@ -2207,47 +2300,47 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
                char *dither= "";
 #endif
                if(flags&SWS_FAST_BILINEAR)
-                       MSG_INFO("\nSwScaler: FAST_BILINEAR scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: FAST_BILINEAR scaler, ");
                else if(flags&SWS_BILINEAR)
-                       MSG_INFO("\nSwScaler: BILINEAR scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: BILINEAR scaler, ");
                else if(flags&SWS_BICUBIC)
-                       MSG_INFO("\nSwScaler: BICUBIC scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: BICUBIC scaler, ");
                else if(flags&SWS_X)
-                       MSG_INFO("\nSwScaler: Experimental scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Experimental scaler, ");
                else if(flags&SWS_POINT)
-                       MSG_INFO("\nSwScaler: Nearest Neighbor / POINT scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Nearest Neighbor / POINT scaler, ");
                else if(flags&SWS_AREA)
-                       MSG_INFO("\nSwScaler: Area Averageing scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Area Averageing scaler, ");
                else if(flags&SWS_BICUBLIN)
-                       MSG_INFO("\nSwScaler: luma BICUBIC / chroma BILINEAR scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: luma BICUBIC / chroma BILINEAR scaler, ");
                else if(flags&SWS_GAUSS)
-                       MSG_INFO("\nSwScaler: Gaussian scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Gaussian scaler, ");
                else if(flags&SWS_SINC)
-                       MSG_INFO("\nSwScaler: Sinc scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Sinc scaler, ");
                else if(flags&SWS_LANCZOS)
-                       MSG_INFO("\nSwScaler: Lanczos scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Lanczos scaler, ");
                else if(flags&SWS_SPLINE)
-                       MSG_INFO("\nSwScaler: Bicubic spline scaler, ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: Bicubic spline scaler, ");
                else
-                       MSG_INFO("\nSwScaler: ehh flags invalid?! ");
+                       av_log(c, AV_LOG_INFO, "SwScaler: ehh flags invalid?! ");
 
                if(dstFormat==PIX_FMT_BGR555 || dstFormat==PIX_FMT_BGR565)
-                       MSG_INFO("from %s to%s %s ", 
+                       av_log(c, AV_LOG_INFO, "from %s to%s %s ", 
                                sws_format_name(srcFormat), dither, sws_format_name(dstFormat));
                else
-                       MSG_INFO("from %s to %s ", 
+                       av_log(c, AV_LOG_INFO, "from %s to %s ", 
                                sws_format_name(srcFormat), sws_format_name(dstFormat));
 
                if(flags & SWS_CPU_CAPS_MMX2)
-                       MSG_INFO("using MMX2\n");
+                       av_log(c, AV_LOG_INFO, "using MMX2\n");
                else if(flags & SWS_CPU_CAPS_3DNOW)
-                       MSG_INFO("using 3DNOW\n");
+                       av_log(c, AV_LOG_INFO, "using 3DNOW\n");
                else if(flags & SWS_CPU_CAPS_MMX)
-                       MSG_INFO("using MMX\n");
+                       av_log(c, AV_LOG_INFO, "using MMX\n");
                else if(flags & SWS_CPU_CAPS_ALTIVEC)
-                       MSG_INFO("using AltiVec\n");
+                       av_log(c, AV_LOG_INFO, "using AltiVec\n");
                else 
-                       MSG_INFO("using C\n");
+                       av_log(c, AV_LOG_INFO, "using C\n");
        }
 
        if(flags & SWS_PRINT_INFO)
@@ -2255,70 +2348,70 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
                if(flags & SWS_CPU_CAPS_MMX)
                {
                        if(c->canMMX2BeUsed && (flags&SWS_FAST_BILINEAR))
-                               MSG_V("SwScaler: using FAST_BILINEAR MMX2 scaler for horizontal scaling\n");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using FAST_BILINEAR MMX2 scaler for horizontal scaling\n");
                        else
                        {
                                if(c->hLumFilterSize==4)
-                                       MSG_V("SwScaler: using 4-tap MMX scaler for horizontal luminance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using 4-tap MMX scaler for horizontal luminance scaling\n");
                                else if(c->hLumFilterSize==8)
-                                       MSG_V("SwScaler: using 8-tap MMX scaler for horizontal luminance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using 8-tap MMX scaler for horizontal luminance scaling\n");
                                else
-                                       MSG_V("SwScaler: using n-tap MMX scaler for horizontal luminance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using n-tap MMX scaler for horizontal luminance scaling\n");
 
                                if(c->hChrFilterSize==4)
-                                       MSG_V("SwScaler: using 4-tap MMX scaler for horizontal chrominance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using 4-tap MMX scaler for horizontal chrominance scaling\n");
                                else if(c->hChrFilterSize==8)
-                                       MSG_V("SwScaler: using 8-tap MMX scaler for horizontal chrominance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using 8-tap MMX scaler for horizontal chrominance scaling\n");
                                else
-                                       MSG_V("SwScaler: using n-tap MMX scaler for horizontal chrominance scaling\n");
+                                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using n-tap MMX scaler for horizontal chrominance scaling\n");
                        }
                }
                else
                {
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
-                       MSG_V("SwScaler: using X86-Asm scaler for horizontal scaling\n");
+#if defined(ARCH_X86)
+                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using X86-Asm scaler for horizontal scaling\n");
 #else
                        if(flags & SWS_FAST_BILINEAR)
-                               MSG_V("SwScaler: using FAST_BILINEAR C scaler for horizontal scaling\n");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using FAST_BILINEAR C scaler for horizontal scaling\n");
                        else
-                               MSG_V("SwScaler: using C scaler for horizontal scaling\n");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using C scaler for horizontal scaling\n");
 #endif
                }
                if(isPlanarYUV(dstFormat))
                {
                        if(c->vLumFilterSize==1)
-                               MSG_V("SwScaler: using 1-tap %s \"scaler\" for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using 1-tap %s \"scaler\" for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                        else
-                               MSG_V("SwScaler: using n-tap %s scaler for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using n-tap %s scaler for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                }
                else
                {
                        if(c->vLumFilterSize==1 && c->vChrFilterSize==2)
-                               MSG_V("SwScaler: using 1-tap %s \"scaler\" for vertical luminance scaling (BGR)\n"
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using 1-tap %s \"scaler\" for vertical luminance scaling (BGR)\n"
                                       "SwScaler:       2-tap scaler for vertical chrominance scaling (BGR)\n",(flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                        else if(c->vLumFilterSize==2 && c->vChrFilterSize==2)
-                               MSG_V("SwScaler: using 2-tap linear %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using 2-tap linear %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                        else
-                               MSG_V("SwScaler: using n-tap %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                               av_log(c, AV_LOG_VERBOSE, "SwScaler: using n-tap %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                }
 
                if(dstFormat==PIX_FMT_BGR24)
-                       MSG_V("SwScaler: using %s YV12->BGR24 Converter\n",
+                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using %s YV12->BGR24 Converter\n",
                                (flags & SWS_CPU_CAPS_MMX2) ? "MMX2" : ((flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C"));
                else if(dstFormat==PIX_FMT_RGB32)
-                       MSG_V("SwScaler: using %s YV12->BGR32 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using %s YV12->BGR32 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                else if(dstFormat==PIX_FMT_BGR565)
-                       MSG_V("SwScaler: using %s YV12->BGR16 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using %s YV12->BGR16 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
                else if(dstFormat==PIX_FMT_BGR555)
-                       MSG_V("SwScaler: using %s YV12->BGR15 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
+                       av_log(c, AV_LOG_VERBOSE, "SwScaler: using %s YV12->BGR15 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
 
-               MSG_V("SwScaler: %dx%d -> %dx%d\n", srcW, srcH, dstW, dstH);
+               av_log(c, AV_LOG_VERBOSE, "SwScaler: %dx%d -> %dx%d\n", srcW, srcH, dstW, dstH);
        }
        if(flags & SWS_PRINT_INFO)
        {
-               MSG_DBG2("SwScaler:Lum srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
+               av_log(c, AV_LOG_DEBUG, "SwScaler:Lum srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
                        c->srcW, c->srcH, c->dstW, c->dstH, c->lumXInc, c->lumYInc);
-               MSG_DBG2("SwScaler:Chr srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
+               av_log(c, AV_LOG_DEBUG, "SwScaler:Chr srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
                        c->chrSrcW, c->chrSrcH, c->chrDstW, c->chrDstH, c->chrXInc, c->chrYInc);
        }
 
@@ -2330,10 +2423,10 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
  * swscale warper, so we don't need to export the SwsContext.
  * assumes planar YUV to be in YUV order instead of YVU
  */
-int sws_scale_ordered(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
+int sws_scale(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
                            int srcSliceH, uint8_t* dst[], int dstStride[]){
        if (c->sliceDir == 0 && srcSliceY != 0 && srcSliceY + srcSliceH != c->srcH) {
-           MSG_ERR("swScaler: slices start in the middle!\n");
+           av_log(c, AV_LOG_ERROR, "swScaler: slices start in the middle!\n");
            return 0;
        }
        if (c->sliceDir == 0) {
@@ -2365,15 +2458,9 @@ int sws_scale_ordered(SwsContext *c, uint8_t* src[], int srcStride[], int srcSli
 /**
  * swscale warper, so we don't need to export the SwsContext
  */
-int sws_scale(SwsContext *c, uint8_t* srcParam[], int srcStride[], int srcSliceY,
-                           int srcSliceH, uint8_t* dstParam[], int dstStride[]){
-       uint8_t *src[3];
-       uint8_t *dst[3];
-       src[0] = srcParam[0]; src[1] = srcParam[1]; src[2] = srcParam[2];
-       dst[0] = dstParam[0]; dst[1] = dstParam[1]; dst[2] = dstParam[2];
-//printf("sws: slice %d %d\n", srcSliceY, srcSliceH);
-
-       return c->swScale(c, src, srcStride, srcSliceY, srcSliceH, dst, dstStride);
+int sws_scale_ordered(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,
+                           int srcSliceH, uint8_t* dst[], int dstStride[]){
+       return sws_scale(c, src, srcStride, srcSliceY, srcSliceH, dst, dstStride);
 }
 
 SwsFilter *sws_getDefaultFilter(float lumaGBlur, float chromaGBlur, 
@@ -2557,7 +2644,7 @@ static SwsVector *sws_diffVec(SwsVector *a, SwsVector *b){
 
 /* shift left / or right if "shift" is negative */
 static SwsVector *sws_getShiftedVec(SwsVector *a, int shift){
-       int length= a->length + ABS(shift)*2;
+       int length= a->length + FFABS(shift)*2;
        double *coeff= av_malloc(length*sizeof(double));
        int i;
        SwsVector *vec= av_malloc(sizeof(SwsVector));
@@ -2637,9 +2724,9 @@ void sws_printVec(SwsVector *a){
        for(i=0; i<a->length; i++)
        {
                int x= (int)((a->coeff[i]-min)*60.0/range +0.5);
-               MSG_DBG2("%1.3f ", a->coeff[i]);
-               for(;x>0; x--) MSG_DBG2(" ");
-               MSG_DBG2("|\n");
+               av_log(NULL, AV_LOG_DEBUG, "%1.3f ", a->coeff[i]);
+               for(;x>0; x--) av_log(NULL, AV_LOG_DEBUG, " ");
+               av_log(NULL, AV_LOG_DEBUG, "|\n");
        }
 }
 
@@ -2712,7 +2799,7 @@ void sws_freeContext(SwsContext *c){
        av_free(c->hChrFilterPos);
        c->hChrFilterPos = NULL;
 
-#if defined(ARCH_X86) || defined(ARCH_X86_64)
+#if defined(ARCH_X86) && defined(CONFIG_GPL)
 #ifdef MAP_ANONYMOUS
        if(c->funnyYCode) munmap(c->funnyYCode, MAX_FUNNY_CODE_SIZE);
        if(c->funnyUVCode) munmap(c->funnyUVCode, MAX_FUNNY_CODE_SIZE);
@@ -2722,7 +2809,7 @@ void sws_freeContext(SwsContext *c){
 #endif
        c->funnyYCode=NULL;
        c->funnyUVCode=NULL;
-#endif /* defined(ARCH_X86) || defined(ARCH_X86_64) */
+#endif /* defined(ARCH_X86) */
 
        av_free(c->lumMmx2Filter);
        c->lumMmx2Filter=NULL;