X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=common%2Fpixel.h;h=35be44ca2cbc665e0b8e92e0ec4318cc8a24adc6;hb=88af51b0bbe92bf6868cb4fb81b147ea6e0e0eed;hp=f8012bab0898e7a1ce94ea5f9f1968ad889dcb0b;hpb=d69837d312aa09c020416008c26f7008783d8c7f;p=x264 diff --git a/common/pixel.h b/common/pixel.h index f8012bab..35be44ca 100644 --- a/common/pixel.h +++ b/common/pixel.h @@ -1,10 +1,11 @@ /***************************************************************************** - * pixel.h: h264 encoder library + * pixel.c: pixel metrics ***************************************************************************** - * Copyright (C) 2003 Laurent Aimar - * $Id: pixel.h,v 1.1 2004/06/03 19:27:07 fenrir Exp $ + * Copyright (C) 2004-2016 x264 project * - * Authors: Laurent Aimar + * Authors: Loren Merritt + * Fiona Glaser + Henrik Gramner * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by @@ -18,13 +19,20 @@ * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software - * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111, USA. + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA. + * + * This program is also available under a commercial proprietary license. + * For more information, contact us at licensing@x264.com. *****************************************************************************/ -#ifndef _PIXEL_H -#define _PIXEL_H 1 +#ifndef X264_PIXEL_H +#define X264_PIXEL_H -typedef int (*x264_pixel_cmp_t) ( uint8_t *, int, uint8_t *, int ); +// SSD assumes all args aligned +// other cmp functions assume first arg aligned +typedef int (*x264_pixel_cmp_t) ( pixel *, intptr_t, pixel *, intptr_t ); +typedef void (*x264_pixel_cmp_x3_t) ( pixel *, pixel *, pixel *, pixel *, intptr_t, int[3] ); +typedef void (*x264_pixel_cmp_x4_t) ( pixel *, pixel *, pixel *, pixel *, pixel *, intptr_t, int[4] ); enum { @@ -35,23 +43,23 @@ enum PIXEL_8x4 = 4, PIXEL_4x8 = 5, PIXEL_4x4 = 6, - PIXEL_4x2 = 7, - PIXEL_2x4 = 8, - PIXEL_2x2 = 9, + + /* Subsampled chroma only */ + PIXEL_4x16 = 7, /* 4:2:2 */ + PIXEL_4x2 = 8, + PIXEL_2x8 = 9, /* 4:2:2 */ + PIXEL_2x4 = 10, + PIXEL_2x2 = 11, }; -static const struct { - int w; - int h; -} x264_pixel_size[7] = { - { 16, 16 }, - { 16, 8 }, { 8, 16 }, - { 8, 8 }, - { 8, 4 }, { 4, 8 }, - { 4, 4 } +static const struct { uint8_t w, h; } x264_pixel_size[12] = +{ + { 16, 16 }, { 16, 8 }, { 8, 16 }, { 8, 8 }, { 8, 4 }, { 4, 8 }, { 4, 4 }, + { 4, 16 }, { 4, 2 }, { 2, 8 }, { 2, 4 }, { 2, 2 }, }; -static const int x264_size2pixel[5][5] = { +static const uint8_t x264_size2pixel[5][5] = +{ { 0, }, { 0, PIXEL_4x4, PIXEL_8x4, 0, 0 }, { 0, PIXEL_4x8, PIXEL_8x8, 0, PIXEL_16x8 }, @@ -59,16 +67,90 @@ static const int x264_size2pixel[5][5] = { { 0, 0, PIXEL_8x16, 0, PIXEL_16x16 } }; +static const uint8_t x264_luma2chroma_pixel[4][7] = +{ + { 0 }, + { PIXEL_8x8, PIXEL_8x4, PIXEL_4x8, PIXEL_4x4, PIXEL_4x2, PIXEL_2x4, PIXEL_2x2 }, /* 4:2:0 */ + { PIXEL_8x16, PIXEL_8x8, PIXEL_4x16, PIXEL_4x8, PIXEL_4x4, PIXEL_2x8, PIXEL_2x4 }, /* 4:2:2 */ + { PIXEL_16x16, PIXEL_16x8, PIXEL_8x16, PIXEL_8x8, PIXEL_8x4, PIXEL_4x8, PIXEL_4x4 }, /* 4:4:4 */ +}; + typedef struct { - x264_pixel_cmp_t sad[7]; - x264_pixel_cmp_t ssd[7]; - x264_pixel_cmp_t satd[7]; + x264_pixel_cmp_t sad[8]; + x264_pixel_cmp_t ssd[8]; + x264_pixel_cmp_t satd[8]; + x264_pixel_cmp_t ssim[7]; x264_pixel_cmp_t sa8d[4]; - x264_pixel_cmp_t mbcmp[7]; /* either satd or sad for subpel refine and mode decision */ + x264_pixel_cmp_t mbcmp[8]; /* either satd or sad for subpel refine and mode decision */ + x264_pixel_cmp_t mbcmp_unaligned[8]; /* unaligned mbcmp for subpel */ + x264_pixel_cmp_t fpelcmp[8]; /* either satd or sad for fullpel motion search */ + x264_pixel_cmp_x3_t fpelcmp_x3[7]; + x264_pixel_cmp_x4_t fpelcmp_x4[7]; + x264_pixel_cmp_t sad_aligned[8]; /* Aligned SAD for mbcmp */ + int (*vsad)( pixel *, intptr_t, int ); + int (*asd8)( pixel *pix1, intptr_t stride1, pixel *pix2, intptr_t stride2, int height ); + uint64_t (*sa8d_satd[1])( pixel *pix1, intptr_t stride1, pixel *pix2, intptr_t stride2 ); + + uint64_t (*var[4])( pixel *pix, intptr_t stride ); + int (*var2[4])( pixel *pix1, intptr_t stride1, + pixel *pix2, intptr_t stride2, int *ssd ); + uint64_t (*hadamard_ac[4])( pixel *pix, intptr_t stride ); + + void (*ssd_nv12_core)( pixel *pixuv1, intptr_t stride1, + pixel *pixuv2, intptr_t stride2, int width, int height, + uint64_t *ssd_u, uint64_t *ssd_v ); + void (*ssim_4x4x2_core)( const pixel *pix1, intptr_t stride1, + const pixel *pix2, intptr_t stride2, int sums[2][4] ); + float (*ssim_end4)( int sum0[5][4], int sum1[5][4], int width ); + + /* multiple parallel calls to cmp. */ + x264_pixel_cmp_x3_t sad_x3[7]; + x264_pixel_cmp_x4_t sad_x4[7]; + x264_pixel_cmp_x3_t satd_x3[7]; + x264_pixel_cmp_x4_t satd_x4[7]; + + /* abs-diff-sum for successive elimination. + * may round width up to a multiple of 16. */ + int (*ads[7])( int enc_dc[4], uint16_t *sums, int delta, + uint16_t *cost_mvx, int16_t *mvs, int width, int thresh ); + + /* calculate satd or sad of V, H, and DC modes. */ + void (*intra_mbcmp_x3_16x16)( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_satd_x3_16x16) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_sad_x3_16x16) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_mbcmp_x3_4x4) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_satd_x3_4x4) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_sad_x3_4x4) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_mbcmp_x3_chroma)( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_satd_x3_chroma) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_sad_x3_chroma) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_mbcmp_x3_8x16c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_satd_x3_8x16c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_sad_x3_8x16c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_mbcmp_x3_8x8c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_satd_x3_8x8c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_sad_x3_8x8c) ( pixel *fenc, pixel *fdec, int res[3] ); + void (*intra_mbcmp_x3_8x8) ( pixel *fenc, pixel edge[36], int res[3] ); + void (*intra_sa8d_x3_8x8) ( pixel *fenc, pixel edge[36], int res[3] ); + void (*intra_sad_x3_8x8) ( pixel *fenc, pixel edge[36], int res[3] ); + /* find minimum satd or sad of all modes, and set fdec. + * may be NULL, in which case just use pred+satd instead. */ + int (*intra_mbcmp_x9_4x4)( pixel *fenc, pixel *fdec, uint16_t *bitcosts ); + int (*intra_satd_x9_4x4) ( pixel *fenc, pixel *fdec, uint16_t *bitcosts ); + int (*intra_sad_x9_4x4) ( pixel *fenc, pixel *fdec, uint16_t *bitcosts ); + int (*intra_mbcmp_x9_8x8)( pixel *fenc, pixel *fdec, pixel edge[36], uint16_t *bitcosts, uint16_t *satds ); + int (*intra_sa8d_x9_8x8) ( pixel *fenc, pixel *fdec, pixel edge[36], uint16_t *bitcosts, uint16_t *satds ); + int (*intra_sad_x9_8x8) ( pixel *fenc, pixel *fdec, pixel edge[36], uint16_t *bitcosts, uint16_t *satds ); } x264_pixel_function_t; void x264_pixel_init( int cpu, x264_pixel_function_t *pixf ); -int64_t x264_pixel_ssd_wxh( x264_pixel_function_t *pf, uint8_t *pix1, int i_pix1, uint8_t *pix2, int i_pix2, int i_width, int i_height ); +void x264_pixel_ssd_nv12 ( x264_pixel_function_t *pf, pixel *pix1, intptr_t i_pix1, pixel *pix2, intptr_t i_pix2, + int i_width, int i_height, uint64_t *ssd_u, uint64_t *ssd_v ); +uint64_t x264_pixel_ssd_wxh( x264_pixel_function_t *pf, pixel *pix1, intptr_t i_pix1, pixel *pix2, intptr_t i_pix2, + int i_width, int i_height ); +float x264_pixel_ssim_wxh ( x264_pixel_function_t *pf, pixel *pix1, intptr_t i_pix1, pixel *pix2, intptr_t i_pix2, + int i_width, int i_height, void *buf, int *cnt ); +int x264_field_vsad( x264_t *h, int mb_x, int mb_y ); #endif