#undef HAVE_AV_CONFIG_H
#include "libavutil/avutil.h"
+#include "libavutil/lfg.h"
#include "swscale.h"
-#include "swscale_internal.h"
-#include "rgb2rgb.h"
-static uint64_t getSSD(uint8_t *src1, uint8_t *src2, int stride1, int stride2, int w, int h){
+/* HACK: the declarations below are duplicated from swscale_internal.h.
+ * They should be removed when a cleaner pixel format system exists. */
+const char *sws_format_name(enum PixelFormat format);
+
+/* Nonzero for the 8-bit and both 16-bit gray formats. */
+#define isGray(x) \
+    ((x) == PIX_FMT_GRAY8 || (x) == PIX_FMT_GRAY16BE || (x) == PIX_FMT_GRAY16LE)
+
+/* Nonzero unless the format is gray or one of the two monochrome formats. */
+#define hasChroma(x) \
+    (!isGray(x) && (x) != PIX_FMT_MONOBLACK && (x) != PIX_FMT_MONOWHITE)
+
+/* Nonzero for the four 32-bit RGB/BGR formats and for YUVA420P. */
+#define isALPHA(x) \
+    ((x) == PIX_FMT_BGR32 || (x) == PIX_FMT_BGR32_1 || \
+     (x) == PIX_FMT_RGB32 || (x) == PIX_FMT_RGB32_1 || \
+     (x) == PIX_FMT_YUVA420P)
+
+static uint64_t getSSD(uint8_t *src1, uint8_t *src2, int stride1, int stride2, int w, int h)
+{
int x,y;
uint64_t ssd=0;
//printf("%d %d\n", w, h);
- for (y=0; y<h; y++){
- for (x=0; x<w; x++){
+ for (y=0; y<h; y++) {
+ for (x=0; x<w; x++) {
int d= src1[x + y*stride1] - src2[x + y*stride2];
ssd+= d*d;
//printf("%d", abs(src1[x + y*stride1] - src2[x + y*stride2])/26 );
// test by ref -> src -> dst -> out & compare out against ref
-// ref & out are YV12
+// ref & out are YUVA420P
-static int doTest(uint8_t *ref[3], int refStride[3], int w, int h, int srcFormat, int dstFormat,
- int srcW, int srcH, int dstW, int dstH, int flags){
- uint8_t *src[3];
- uint8_t *dst[3];
- uint8_t *out[3];
- int srcStride[3], dstStride[3];
+static int doTest(uint8_t *ref[4], int refStride[4], int w, int h, int srcFormat, int dstFormat,
+ int srcW, int srcH, int dstW, int dstH, int flags)
+{
+ uint8_t *src[4] = {0};
+ uint8_t *dst[4] = {0};
+ uint8_t *out[4] = {0};
+ int srcStride[4], dstStride[4];
int i;
- uint64_t ssdY, ssdU, ssdV;
- struct SwsContext *srcContext, *dstContext, *outContext;
+ uint64_t ssdY, ssdU=0, ssdV=0, ssdA=0;
+ struct SwsContext *srcContext = NULL, *dstContext = NULL,
+ *outContext = NULL;
int res;
res = 0;
- for (i=0; i<3; i++){
+ for (i=0; i<4; i++) {
// avoid stride % bpp != 0
if (srcFormat==PIX_FMT_RGB24 || srcFormat==PIX_FMT_BGR24)
srcStride[i]= srcW*3;
+ else if (srcFormat==PIX_FMT_RGB48BE || srcFormat==PIX_FMT_RGB48LE)
+ srcStride[i]= srcW*6;
else
srcStride[i]= srcW*4;
if (dstFormat==PIX_FMT_RGB24 || dstFormat==PIX_FMT_BGR24)
dstStride[i]= dstW*3;
+ else if (dstFormat==PIX_FMT_RGB48BE || dstFormat==PIX_FMT_RGB48LE)
+ dstStride[i]= dstW*6;
else
dstStride[i]= dstW*4;
- src[i]= (uint8_t*) malloc(srcStride[i]*srcH);
- dst[i]= (uint8_t*) malloc(dstStride[i]*dstH);
- out[i]= (uint8_t*) malloc(refStride[i]*h);
+ src[i]= malloc(srcStride[i]*srcH);
+ dst[i]= malloc(dstStride[i]*dstH);
+ out[i]= malloc(refStride[i]*h);
if (!src[i] || !dst[i] || !out[i]) {
perror("Malloc");
res = -1;
}
}
- dstContext = outContext = NULL;
- srcContext= sws_getContext(w, h, PIX_FMT_YUV420P, srcW, srcH, srcFormat, flags, NULL, NULL, NULL);
+ srcContext= sws_getContext(w, h, PIX_FMT_YUVA420P, srcW, srcH, srcFormat, flags, NULL, NULL, NULL);
if (!srcContext) {
fprintf(stderr, "Failed to get %s ---> %s\n",
- sws_format_name(PIX_FMT_YUV420P),
+ sws_format_name(PIX_FMT_YUVA420P),
sws_format_name(srcFormat));
res = -1;
goto end;
}
- outContext= sws_getContext(dstW, dstH, dstFormat, w, h, PIX_FMT_YUV420P, flags, NULL, NULL, NULL);
+ outContext= sws_getContext(dstW, dstH, dstFormat, w, h, PIX_FMT_YUVA420P, flags, NULL, NULL, NULL);
if (!outContext) {
fprintf(stderr, "Failed to get %s ---> %s\n",
sws_format_name(dstFormat),
- sws_format_name(PIX_FMT_YUV420P));
+ sws_format_name(PIX_FMT_YUVA420P));
res = -1;
goto end;
sws_scale(dstContext, src, srcStride, 0, srcH, dst, dstStride);
sws_scale(outContext, dst, dstStride, 0, dstH, out, refStride);
-#if defined(ARCH_X86)
- asm volatile ("emms\n\t");
-#endif
-
ssdY= getSSD(ref[0], out[0], refStride[0], refStride[0], w, h);
- ssdU= getSSD(ref[1], out[1], refStride[1], refStride[1], (w+1)>>1, (h+1)>>1);
- ssdV= getSSD(ref[2], out[2], refStride[2], refStride[2], (w+1)>>1, (h+1)>>1);
-
- if (srcFormat == PIX_FMT_GRAY8 || dstFormat==PIX_FMT_GRAY8) ssdU=ssdV=0; //FIXME check that output is really gray
+ if (hasChroma(srcFormat) && hasChroma(dstFormat)) {
+ //FIXME check that output is really gray
+ ssdU= getSSD(ref[1], out[1], refStride[1], refStride[1], (w+1)>>1, (h+1)>>1);
+ ssdV= getSSD(ref[2], out[2], refStride[2], refStride[2], (w+1)>>1, (h+1)>>1);
+ }
+ if (isALPHA(srcFormat) && isALPHA(dstFormat))
+ ssdA= getSSD(ref[3], out[3], refStride[3], refStride[3], w, h);
ssdY/= w*h;
ssdU/= w*h/4;
ssdV/= w*h/4;
+ ssdA/= w*h;
- printf(" %s %dx%d -> %s %4dx%4d flags=%2d SSD=%5lld,%5lld,%5lld\n",
+ printf(" %s %dx%d -> %s %4dx%4d flags=%2d SSD=%5"PRId64",%5"PRId64",%5"PRId64",%5"PRId64"\n",
sws_format_name(srcFormat), srcW, srcH,
sws_format_name(dstFormat), dstW, dstH,
- flags, ssdY, ssdU, ssdV);
+ flags, ssdY, ssdU, ssdV, ssdA);
fflush(stdout);
- end:
+end:
sws_freeContext(srcContext);
sws_freeContext(dstContext);
sws_freeContext(outContext);
- for (i=0; i<3; i++){
+ for (i=0; i<4; i++) {
free(src[i]);
free(dst[i]);
free(out[i]);
return res;
}
-void fast_memcpy(void *a, void *b, int s){ //FIXME
- memcpy(a, b, s);
-}
-
-static void selfTest(uint8_t *src[3], int stride[3], int w, int h){
+/*
+ * Run doTest() for every (srcFormat, dstFormat) pair below PIX_FMT_NB.
+ *
+ * For each pair the reference picture (ref/refStride, w x h) is tested with
+ * destination widths w - w/3, w, w + w/3, the same three variants of the
+ * height, and every scaler flag in the list below. The sweep for a pair is
+ * abandoned as soon as doTest() returns non-zero.
+ */
+static void selfTest(uint8_t *ref[4], int refStride[4], int w, int h)
+{
+    const int srcW = w;
+    const int srcH = h;
+    /* All three lists are terminated by a 0 entry. */
+    const int flags[] = { SWS_FAST_BILINEAR, SWS_BILINEAR, SWS_BICUBIC,
+                          SWS_X, SWS_POINT, SWS_AREA, 0 };
+    const int dstW[]  = { srcW - srcW/3, srcW, srcW + srcW/3, 0 };
+    const int dstH[]  = { srcH - srcH/3, srcH, srcH + srcH/3, 0 };
     enum PixelFormat srcFormat, dstFormat;
-    int srcW, srcH, dstW, dstH;
-    int flags;
     for (srcFormat = 0; srcFormat < PIX_FMT_NB; srcFormat++) {
         for (dstFormat = 0; dstFormat < PIX_FMT_NB; dstFormat++) {
+            int wIdx, hIdx, flagIdx;
+            int res = 0;
+
             printf("%s -> %s\n",
                    sws_format_name(srcFormat),
                    sws_format_name(dstFormat));
             fflush(stdout);
-            srcW= w;
-            srcH= h;
-            for (dstW=w - w/3; dstW<= 4*w/3; dstW+= w/3){
-                for (dstH=h - h/3; dstH<= 4*h/3; dstH+= h/3){
-                    for (flags=1; flags<33; flags*=2) {
-                        int res;
-
-                        res = doTest(src, stride, w, h, srcFormat, dstFormat,
-                                     srcW, srcH, dstW, dstH, flags);
-                        if (res < 0) {
-                            dstW = 4 * w / 3;
-                            dstH = 4 * h / 3;
-                            flags = 33;
-                        }
-                    }
-                }
-            }
+            /* Every loop also tests !res, so one failure ends all three. */
+            for (wIdx = 0; dstW[wIdx] && !res; wIdx++) {
+                for (hIdx = 0; dstH[hIdx] && !res; hIdx++) {
+                    for (flagIdx = 0; flags[flagIdx] && !res; flagIdx++) {
+                        res = doTest(ref, refStride, w, h,
+                                     srcFormat, dstFormat,
+                                     srcW, srcH,
+                                     dstW[wIdx], dstH[hIdx], flags[flagIdx]);
+                    }
+                }
+            }
         }
     }
 }
#define W 96
#define H 96
-int main(int argc, char **argv){
+/*
+ * Test entry point.
+ *
+ * Fills a W x H 32-bit RGB buffer with pseudo-random bytes from an AVLFG
+ * seeded with 1, scales its top-left (W/12) x (H/12) region up to a W x H
+ * YUVA420P reference picture, and passes that picture to selfTest().
+ *
+ * Returns 0 after selfTest() has run, or -1 if a buffer or the scaler
+ * context could not be allocated.
+ */
+int main(int argc, char **argv)
+{
     uint8_t *rgb_data = malloc (W*H*4);
-    uint8_t *rgb_src[3]= {rgb_data, NULL, NULL};
-    int rgb_stride[3]={4*W, 0, 0};
-    uint8_t *data = malloc (3*W*H);
-    uint8_t *src[3]= {data, data+W*H, data+W*H*2};
-    int stride[3]={W, W, W};
+    /* Four entries, like src/stride below, so that every plane array handed
+     * to sws_scale() has the same length. */
+    uint8_t *rgb_src[4]= {rgb_data, NULL, NULL, NULL};
+    int rgb_stride[4]={4*W, 0, 0, 0};
+    uint8_t *data = malloc (4*W*H);
+    uint8_t *src[4]= {data, data+W*H, data+W*H*2, data+W*H*3};
+    int stride[4]={W, W, W, W};
     int x, y;
     struct SwsContext *sws;
+    AVLFG rand;
+
+    if (!rgb_data || !data) {
+        /* free(NULL) is a no-op, so this releases whichever one succeeded. */
+        free(rgb_data);
+        free(data);
+        return -1;
+    }
-    sws= sws_getContext(W/12, H/12, PIX_FMT_RGB32, W, H, PIX_FMT_YUV420P, 2, NULL, NULL, NULL);
+    sws= sws_getContext(W/12, H/12, PIX_FMT_RGB32, W, H, PIX_FMT_YUVA420P, SWS_BILINEAR, NULL, NULL, NULL);
+    if (!sws) {
+        /* Without a context the sws_scale() call below cannot run. */
+        fprintf(stderr, "Failed to get the reference scaler context\n");
+        free(rgb_data);
+        free(data);
+        return -1;
+    }
-    for (y=0; y<H; y++){
-        for (x=0; x<W*4; x++){
-            rgb_data[ x + y*4*W]= random();
+    av_lfg_init(&rand, 1);
+
+    for (y=0; y<H; y++) {
+        for (x=0; x<W*4; x++) {
+            rgb_data[ x + y*4*W]= av_lfg_get(&rand);
         }
     }
-#if defined(ARCH_X86)
-    sws_rgb2rgb_init(SWS_CPU_CAPS_MMX*0);
-#else
-    sws_rgb2rgb_init(0);
-#endif
-    sws_scale(sws, rgb_src, rgb_stride, 0, H, src, stride);
-
-#if defined(ARCH_X86)
-    asm volatile ("emms\n\t");
-#endif
+    /* The context was created for a (W/12) x (H/12) source, so the slice
+     * passed in is H/12 rows high, not H. */
+    sws_scale(sws, rgb_src, rgb_stride, 0, H/12, src, stride);
+    sws_freeContext(sws);
+    free(rgb_data);
     selfTest(src, stride, W, H);
+    free(data);
-    return 123;
+    return 0;
 }