MBAFF: Inter support

author Simon Horlick <simonhorlick@gmail.com>

Tue, 29 Mar 2011 19:25:23 +0000 (20:25 +0100)

committer Fiona Glaser <fiona@x264.com>

Thu, 12 May 2011 06:06:07 +0000 (23:06 -0700)
author Simon Horlick <simonhorlick@gmail.com>
Tue, 29 Mar 2011 19:25:23 +0000 (20:25 +0100)
committer Fiona Glaser <fiona@x264.com>
Thu, 12 May 2011 06:06:07 +0000 (23:06 -0700)
diff --git a/common/common.h b/common/common.h

index 743bd6cb56fb56a2ba66cff7558a7437436fcf95..1cc6508db412456fee4a1607f5b3e7fe9e0cc712 100644 (file)
--- a/common/common.h
+++ b/common/common.h
@@ -746,6 +746,10 @@ struct x264_t
              /* neighbor CBPs */
              int     i_cbp_top;
              int     i_cbp_left;
+
+            /* extra data required for mbaff in mv prediction */
+            int16_t topright_mv[2][3][2];
+            int8_t  topright_ref[2][3];
          } cache;
  
          /* */
diff --git a/common/frame.c b/common/frame.c

index 7273f2b327acfc07a33497a010fe0cd2e9b4b11b..c62d94e01d234cc0e088a5a4ee0a2da713428acd 100644 (file)
--- a/common/frame.c
+++ b/common/frame.c
@@ -100,20 +100,35 @@ x264_frame_t *x264_frame_new( x264_t *h, int b_fdec )
  
      CHECKED_MALLOC( frame->buffer[1], chroma_plane_size * sizeof(pixel) );
      frame->plane[1] = frame->buffer[1] + frame->i_stride[1] * i_padv/2 + PADH;
+    if( h->param.b_interlaced )
+    {
+        CHECKED_MALLOC( frame->buffer_fld[1], chroma_plane_size * sizeof(pixel) );
+        frame->plane_fld[1] = frame->buffer_fld[1] + frame->i_stride[1] * i_padv/2 + PADH;
+    }
  
      /* all 4 luma planes allocated together, since the cacheline split code
       * requires them to be in-phase wrt cacheline alignment. */
      if( h->param.analyse.i_subpel_refine && b_fdec )
      {
+        /* FIXME: Don't allocate both buffers in non-adaptive MBAFF. */
          CHECKED_MALLOC( frame->buffer[0], 4*luma_plane_size * sizeof(pixel) );
+        if( h->param.b_interlaced )
+            CHECKED_MALLOC( frame->buffer_fld[0], 4*luma_plane_size * sizeof(pixel) );
          for( int i = 0; i < 4; i++ )
+        {
              frame->filtered[i] = frame->buffer[0] + i*luma_plane_size + frame->i_stride[0] * i_padv + PADH;
+            frame->filtered_fld[i] = frame->buffer_fld[0] + i*luma_plane_size + frame->i_stride[0] * i_padv + PADH;
+        }
          frame->plane[0] = frame->filtered[0];
+        frame->plane_fld[0] = frame->filtered_fld[0];
      }
      else
      {
          CHECKED_MALLOC( frame->buffer[0], luma_plane_size * sizeof(pixel) );
+        if( h->param.b_interlaced )
+            CHECKED_MALLOC( frame->buffer_fld[0], luma_plane_size * sizeof(pixel) );
          frame->filtered[0] = frame->plane[0] = frame->buffer[0] + frame->i_stride[0] * i_padv + PADH;
+        frame->filtered_fld[0] = frame->plane_fld[0] = frame->buffer_fld[0] + frame->i_stride[0] * i_padv + PADH;
      }
  
      frame->b_duplicate = 0;
@@ -200,7 +215,10 @@ void x264_frame_delete( x264_frame_t *frame )
      if( !frame->b_duplicate )
      {
          for( int i = 0; i < 4; i++ )
+        {
              x264_free( frame->buffer[i] );
+            x264_free( frame->buffer_fld[i] );
+        }
          for( int i = 0; i < 4; i++ )
              x264_free( frame->buffer_lowres[i] );
          for( int i = 0; i < X264_BFRAME_MAX+2; i++ )
@@ -363,16 +381,25 @@ void x264_frame_expand_border( x264_t *h, x264_frame_t *frame, int mb_y, int b_e
          int padh = PADH;
          int padv = PADV >> !!i;
          // buffer: 2 chroma, 3 luma (rounded to 4) because deblocking goes beyond the top of the mb
-        pixel *pix = frame->plane[i] + X264_MAX(0, (16*mb_y-4)*stride >> !!i);
          if( b_end && !b_start )
              height += 4 >> (!!i + h->sh.b_mbaff);
+        pixel *pix;
          if( h->sh.b_mbaff )
          {
+            // border samples for each field are extended separately
+            pix = frame->plane_fld[i] + X264_MAX(0, (16*mb_y-4)*stride >> !!i);
              plane_expand_border( pix, stride*2, width, height, padh, padv, b_start, b_end, i );
              plane_expand_border( pix+stride, stride*2, width, height, padh, padv, b_start, b_end, i );
+
+            height = (b_end ? 16*(h->mb.i_mb_height - mb_y) : 32) >> !!i;
+            if( b_end && !b_start )
+                height += 4 >> (!!i);
+            pix = frame->plane[i] + X264_MAX(0, (16*mb_y-4)*stride >> !!i);
+            plane_expand_border( pix, stride, width, height, padh, padv, b_start, b_end, i );
          }
          else
          {
+            pix = frame->plane[i] + X264_MAX(0, (16*mb_y-4)*stride >> !!i);
              plane_expand_border( pix, stride, width, height, padh, padv, b_start, b_end, i );
          }
      }
@@ -392,14 +419,16 @@ void x264_frame_expand_border_filtered( x264_t *h, x264_frame_t *frame, int mb_y
      for( int i = 1; i < 4; i++ )
      {
          // buffer: 8 luma, to match the hpel filter
-        pixel *pix = frame->filtered[i] + (16*mb_y - (8 << h->sh.b_mbaff)) * stride - 4;
+        pixel *pix;
          if( h->sh.b_mbaff )
          {
+            pix = frame->filtered_fld[i] + (16*mb_y - 16) * stride - 4;
              plane_expand_border( pix, stride*2, width, height, padh, padv, b_start, b_end, 0 );
              plane_expand_border( pix+stride, stride*2, width, height, padh, padv, b_start, b_end, 0 );
          }
-        else
-            plane_expand_border( pix, stride, width, height, padh, padv, b_start, b_end, 0 );
+
+        pix = frame->filtered[i] + (16*mb_y - 8) * stride - 4;
+        plane_expand_border( pix, stride, width, height << h->sh.b_mbaff, padh, padv, b_start, b_end, 0 );
      }
  }
  
diff --git a/common/frame.h b/common/frame.h

index 4abef19eaa5c9ec0733d1d0dcb9785905d9f414b..4b86df0eb8ae3a68a8d32070db13262ecdb96bdb 100644 (file)
--- a/common/frame.h
+++ b/common/frame.h
@@ -72,13 +72,16 @@ typedef struct x264_frame
      int     i_width_lowres;
      int     i_lines_lowres;
      pixel *plane[2];
+    pixel *plane_fld[2];
      pixel *filtered[4]; /* plane[0], H, V, HV */
+    pixel *filtered_fld[4];
      pixel *lowres[4]; /* half-size copy of input frame: Orig, H, V, HV */
      uint16_t *integral;
  
      /* for unrestricted mv we allocate more data than needed
       * allocated data are stored in buffer */
      pixel *buffer[4];
+    pixel *buffer_fld[4];
      pixel *buffer_lowres[4];
  
      x264_weight_t weight[X264_REF_MAX][3]; /* [ref_index][plane] */
diff --git a/common/macroblock.c b/common/macroblock.c

index 0a27e6cde96597208aef66bfae61dedc43440200..34a05d4f3cefd3db65fe79816eb29f1d20b3cd53 100644 (file)
--- a/common/macroblock.c
+++ b/common/macroblock.c
@@ -541,15 +541,28 @@ static void ALWAYS_INLINE x264_macroblock_load_pic_pointers( x264_t *h, int mb_x
              else
                  h->mb.pic.p_fdec[0][-1+j*FDEC_STRIDE] = plane_fdec[-1+j*i_stride2];
      }
+    pixel *plane_src, **filtered_src;
      for( int j = 0; j < h->mb.pic.i_fref[0]; j++ )
      {
-        h->mb.pic.p_fref[0][j][i?4:0] = &h->fref[0][j >> b_interlaced]->plane[i][ref_pix_offset[j&1]];
+        // Interpolate between pixels in same field.
+        if( h->mb.b_interlaced )
+        {
+            plane_src = h->fref[0][j>>1]->plane_fld[i];
+            filtered_src = h->fref[0][j>>1]->filtered_fld;
+        }
+        else
+        {
+            plane_src = h->fref[0][j]->plane[i];
+            filtered_src = h->fref[0][j]->filtered;
+        }
+        h->mb.pic.p_fref[0][j][i?4:0] = plane_src + ref_pix_offset[j&1];
+
          if( !i )
          {
              for( int k = 1; k < 4; k++ )
-                h->mb.pic.p_fref[0][j][k] = &h->fref[0][j >> b_interlaced]->filtered[k][ref_pix_offset[j&1]];
+                h->mb.pic.p_fref[0][j][k] = filtered_src[k] + ref_pix_offset[j&1];
              if( h->sh.weight[j][0].weightfn )
-                h->mb.pic.p_fref_w[j] = &h->fenc->weighted[j >> b_interlaced][ref_pix_offset[j&1]];
+                h->mb.pic.p_fref_w[j] = &h->fenc->weighted[j >> h->mb.b_interlaced][ref_pix_offset[j&1]];
              else
                  h->mb.pic.p_fref_w[j] = h->mb.pic.p_fref[0][j][0];
          }
@@ -557,10 +570,21 @@ static void ALWAYS_INLINE x264_macroblock_load_pic_pointers( x264_t *h, int mb_x
      if( h->sh.i_type == SLICE_TYPE_B )
          for( int j = 0; j < h->mb.pic.i_fref[1]; j++ )
          {
-            h->mb.pic.p_fref[1][j][i?4:0] = &h->fref[1][j >> b_interlaced]->plane[i][ref_pix_offset[j&1]];
+            if( h->mb.b_interlaced )
+            {
+                plane_src = h->fref[1][j>>1]->plane_fld[i];
+                filtered_src = h->fref[1][j>>1]->filtered_fld;
+            }
+            else
+            {
+                plane_src = h->fref[1][j]->plane[i];
+                filtered_src = h->fref[1][j]->filtered;
+            }
+            h->mb.pic.p_fref[1][j][i?4:0] = plane_src + ref_pix_offset[j&1];
+
              if( !i )
                  for( int k = 1; k < 4; k++ )
-                    h->mb.pic.p_fref[1][j][k] = &h->fref[1][j >> b_interlaced]->filtered[k][ref_pix_offset[j&1]];
+                    h->mb.pic.p_fref[1][j][k] = filtered_src[k] + ref_pix_offset[j&1];
          }
  }
  
@@ -807,7 +831,9 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
  
      if( h->mb.i_neighbour & MB_LEFT )
      {
-        h->mb.cache.i_cbp_left = cbp[left[0]];
+        const int16_t top_luma = (cbp[left[0]] >> (left_index_table->mv[0]&(~1))) & 2;
+        const int16_t bot_luma = (cbp[left[1]] >> (left_index_table->mv[2]&(~1))) & 2;
+        h->mb.cache.i_cbp_left = (cbp[left[0]] & 0xfff0) | (bot_luma<<2) | top_luma;
  
          /* load intra4x4 */
          h->mb.cache.intra4x4_pred_mode[x264_scan8[0 ] - 1] = i4x4[left[0]][left_index_table->intra[0]];
@@ -859,8 +885,8 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
          h->mb.pic.i_fref[0] = h->i_ref[0] << h->mb.b_interlaced;
          h->mb.pic.i_fref[1] = h->i_ref[1] << h->mb.b_interlaced;
          h->mb.cache.i_neighbour_interlaced =
-            !!(h->mb.i_neighbour & MB_LEFT)
-          + !!(h->mb.i_neighbour & MB_TOP);
+            !!(h->mb.i_neighbour & MB_LEFT && h->mb.field[left[0]])
+          + !!(h->mb.i_neighbour & MB_TOP && h->mb.field[top]);
      }
  
      if( !h->param.b_interlaced )
@@ -897,8 +923,17 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
          int i8 = x264_scan8[0] - 1 - 1*8;
          if( h->mb.i_neighbour & MB_TOPLEFT )
          {
-            h->mb.cache.ref[l][i8] = ref[top_8x8 - 1];
-            CP32( h->mb.cache.mv[l][i8], mv[top_4x4 - 1] );
+            int ir = 2*(s8x8*h->mb.i_mb_topleft_y + mb_x-1)+1+s8x8;
+            int iv = 4*(s4x4*h->mb.i_mb_topleft_y + mb_x-1)+3+3*s4x4;
+            if( h->mb.topleft_partition )
+            {
+                /* Take motion vector from the middle of macroblock instead of
+                 * the bottom right as usual. */
+                iv -= 2*s4x4;
+                ir -= s8x8;
+            }
+            h->mb.cache.ref[l][i8] = ref[ir];
+            CP32( h->mb.cache.mv[l][i8], mv[iv] );
          }
          else
          {
@@ -924,8 +959,8 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
          i8 = x264_scan8[0] + 4 - 1*8;
          if( h->mb.i_neighbour & MB_TOPRIGHT )
          {
-            h->mb.cache.ref[l][i8] = ref[top_8x8 + 2];
-            CP32( h->mb.cache.mv[l][i8], mv[top_4x4 + 4] );
+            h->mb.cache.ref[l][i8] = ref[2*(s8x8*h->mb.i_mb_topright_y + (mb_x+1))+s8x8];
+            CP32( h->mb.cache.mv[l][i8], mv[4*(s4x4*h->mb.i_mb_topright_y + (mb_x+1))+3*s4x4] );
          }
          else
               h->mb.cache.ref[l][i8] = -2;
@@ -933,17 +968,15 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
          i8 = x264_scan8[0] - 1;
          if( h->mb.i_neighbour & MB_LEFT )
          {
-            const int ir = h->mb.i_b8_xy - 1;
-            const int iv = h->mb.i_b4_xy - 1;
-            h->mb.cache.ref[l][i8+0*8] =
-            h->mb.cache.ref[l][i8+1*8] = ref[ir + 0*s8x8];
-            h->mb.cache.ref[l][i8+2*8] =
-            h->mb.cache.ref[l][i8+3*8] = ref[ir + 1*s8x8];
-
-            CP32( h->mb.cache.mv[l][i8+0*8], mv[iv + 0*s4x4] );
-            CP32( h->mb.cache.mv[l][i8+1*8], mv[iv + 1*s4x4] );
-            CP32( h->mb.cache.mv[l][i8+2*8], mv[iv + 2*s4x4] );
-            CP32( h->mb.cache.mv[l][i8+3*8], mv[iv + 3*s4x4] );
+            h->mb.cache.ref[l][i8+0*8] = ref[h->mb.left_b8[0] + 1 + s8x8*left_index_table->ref[0]];
+            h->mb.cache.ref[l][i8+1*8] = ref[h->mb.left_b8[0] + 1 + s8x8*left_index_table->ref[1]];
+            h->mb.cache.ref[l][i8+2*8] = ref[h->mb.left_b8[1] + 1 + s8x8*left_index_table->ref[2]];
+            h->mb.cache.ref[l][i8+3*8] = ref[h->mb.left_b8[1] + 1 + s8x8*left_index_table->ref[3]];
+
+            CP32( h->mb.cache.mv[l][i8+0*8], mv[h->mb.left_b4[0] + 3 + s4x4*left_index_table->mv[0]] );
+            CP32( h->mb.cache.mv[l][i8+1*8], mv[h->mb.left_b4[0] + 3 + s4x4*left_index_table->mv[1]] );
+            CP32( h->mb.cache.mv[l][i8+2*8], mv[h->mb.left_b4[1] + 3 + s4x4*left_index_table->mv[2]] );
+            CP32( h->mb.cache.mv[l][i8+3*8], mv[h->mb.left_b4[1] + 3 + s4x4*left_index_table->mv[3]] );
          }
          else
          {
@@ -954,6 +987,39 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
              }
          }
  
+        /* Extra logic for top right mv in mbaff.
+         * . . . d  . . a .
+         * . . . e  . . . .
+         * . . . f  b . c .
+         * . . . .  . . . .
+         *
+         * If the top right of the 4x4 partitions labeled a, b and c in the
+         * above diagram do not exist, but the entries d, e and f exist (in
+         * the macroblock to the left) then use those instead.
+         */
+        if( h->sh.b_mbaff && (h->mb.i_neighbour & MB_LEFT) )
+        {
+            if( h->mb.b_interlaced && !h->mb.field[h->mb.i_mb_xy-1] )
+            {
+                h->mb.cache.topright_ref[l][0] = ref[h->mb.left_b8[0] + 1 + s8x8*0];
+                h->mb.cache.topright_ref[l][1] = ref[h->mb.left_b8[0] + 1 + s8x8*1];
+                h->mb.cache.topright_ref[l][2] = ref[h->mb.left_b8[1] + 1 + s8x8*0];
+                CP32( h->mb.cache.topright_mv[l][0], mv[h->mb.left_b4[0] + 3 + s4x4*(left_index_table->mv[0]+1)] );
+                CP32( h->mb.cache.topright_mv[l][1], mv[h->mb.left_b4[0] + 3 + s4x4*(left_index_table->mv[1]+1)] );
+                CP32( h->mb.cache.topright_mv[l][2], mv[h->mb.left_b4[1] + 3 + s4x4*(left_index_table->mv[2]+1)] );
+            }
+            else if( !h->mb.b_interlaced && h->mb.field[h->mb.i_mb_xy-1] )
+            {
+                // Looking at the bottom field so always take the bottom macroblock of the pair.
+                h->mb.cache.topright_ref[l][0] = ref[h->mb.left_b8[0] + 1 + s8x8*2 + s8x8*left_index_table->ref[0]];
+                h->mb.cache.topright_ref[l][1] = ref[h->mb.left_b8[0] + 1 + s8x8*2 + s8x8*left_index_table->ref[0]];
+                h->mb.cache.topright_ref[l][2] = ref[h->mb.left_b8[0] + 1 + s8x8*2 + s8x8*left_index_table->ref[2]];
+                CP32( h->mb.cache.topright_mv[l][0], mv[h->mb.left_b4[0] + 3 + s4x4*4 + s4x4*left_index_table->mv[0]] );
+                CP32( h->mb.cache.topright_mv[l][1], mv[h->mb.left_b4[0] + 3 + s4x4*4 + s4x4*left_index_table->mv[1]] );
+                CP32( h->mb.cache.topright_mv[l][2], mv[h->mb.left_b4[0] + 3 + s4x4*4 + s4x4*left_index_table->mv[2]] );
+            }
+        }
+
          if( h->param.b_cabac )
          {
              uint8_t (*mvd)[8][2] = h->mb.mvd[l];
@@ -962,16 +1028,84 @@ void x264_macroblock_cache_load( x264_t *h, int mb_x, int mb_y )
              else
                  M64( h->mb.cache.mvd[l][x264_scan8[0] - 8] ) = 0;
  
-            if( h->mb.i_neighbour & MB_LEFT )
+            if( h->mb.cache.ref[l][x264_scan8[0]-1] >= 0 )
              {
                  CP16( h->mb.cache.mvd[l][x264_scan8[0 ] - 1], mvd[left[0]][left_index_table->intra[0]] );
                  CP16( h->mb.cache.mvd[l][x264_scan8[2 ] - 1], mvd[left[0]][left_index_table->intra[1]] );
+            }
+            else
+            {
+                M16( h->mb.cache.mvd[l][x264_scan8[0]-1+0*8] ) = 0;
+                M16( h->mb.cache.mvd[l][x264_scan8[0]-1+1*8] ) = 0;
+            }
+            if( h->mb.cache.ref[l][x264_scan8[0]-1+2*8] >=0 )
+            {
                  CP16( h->mb.cache.mvd[l][x264_scan8[8 ] - 1], mvd[left[1]][left_index_table->intra[2]] );
                  CP16( h->mb.cache.mvd[l][x264_scan8[10] - 1], mvd[left[1]][left_index_table->intra[3]] );
              }
              else
-                for( int i = 0; i < 4; i++ )
-                    M16( h->mb.cache.mvd[l][x264_scan8[0]-1+i*8] ) = 0;
+            {
+                M16( h->mb.cache.mvd[l][x264_scan8[0]-1+2*8] ) = 0;
+                M16( h->mb.cache.mvd[l][x264_scan8[0]-1+3*8] ) = 0;
+            }
+        }
+
+        /* If motion vectors are cached from frame macroblocks but this
+         * macroblock is a field macroblock then the motion vector must be
+         * halved. Similarly, motion vectors from field macroblocks are doubled. */
+        if( h->sh.b_mbaff )
+        {
+#define MAP_MVS\
+                if( FIELD_DIFFERENT(h->mb.i_mb_topleft_xy) )\
+                    MAP_F2F(mv, ref, x264_scan8[0] - 1 - 1*8)\
+                if( FIELD_DIFFERENT(top) )\
+                {\
+                    MAP_F2F(mv, ref, x264_scan8[0] + 0 - 1*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] + 1 - 1*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] + 2 - 1*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] + 3 - 1*8)\
+                }\
+                if( FIELD_DIFFERENT(h->mb.i_mb_topright_xy) )\
+                    MAP_F2F(mv, ref, x264_scan8[0] + 4 - 1*8)\
+                if( FIELD_DIFFERENT(left[0]) )\
+                {\
+                    MAP_F2F(mv, ref, x264_scan8[0] - 1 + 0*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] - 1 + 1*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] - 1 + 2*8)\
+                    MAP_F2F(mv, ref, x264_scan8[0] - 1 + 3*8)\
+                    MAP_F2F(topright_mv, topright_ref, 0)\
+                    MAP_F2F(topright_mv, topright_ref, 1)\
+                    MAP_F2F(topright_mv, topright_ref, 2)\
+                }
+
+            if( h->mb.b_interlaced )
+            {
+#define FIELD_DIFFERENT(macroblock) (macroblock >= 0 && !h->mb.field[macroblock])
+#define MAP_F2F(varmv, varref, index)\
+                if( h->mb.cache.varref[l][index] >= 0 )\
+                {\
+                    h->mb.cache.varref[l][index] <<= 1;\
+                    h->mb.cache.varmv[l][index][1] /= 2;\
+                    h->mb.cache.mvd[l][index][1] >>= 1;\
+                }
+                MAP_MVS
+#undef MAP_F2F
+#undef FIELD_DIFFERENT
+            }
+            else
+            {
+#define FIELD_DIFFERENT(macroblock) (macroblock >= 0 && h->mb.field[macroblock])
+#define MAP_F2F(varmv, varref, index)\
+                if( h->mb.cache.varref[l][index] >= 0 )\
+                {\
+                    h->mb.cache.varref[l][index] >>= 1;\
+                    h->mb.cache.varmv[l][index][1] <<= 1;\
+                    h->mb.cache.mvd[l][index][1] <<= 1;\
+                }
+                MAP_MVS
+#undef MAP_F2F
+#undef FIELD_DIFFERENT
+            }
          }
      }
  
diff --git a/common/mc.c b/common/mc.c

index 76061c32a237fd86eedea7d492e442e3a0a29e27..4e727e2d6bc858a8de8058d3672b1fca3240c5b4 100644 (file)
--- a/common/mc.c
+++ b/common/mc.c
@@ -511,18 +511,17 @@ void x264_mc_init( int cpu, x264_mc_functions_t *pf )
  
  void x264_frame_filter( x264_t *h, x264_frame_t *frame, int mb_y, int b_end )
  {
-    const int b_interlaced = h->sh.b_mbaff;
-    const int stride = frame->i_stride[0] << b_interlaced;
+    const int b_interlaced = h->param.b_interlaced;
+    int stride = frame->i_stride[0];
      const int width = frame->i_width[0];
-    int start = (mb_y*16 >> b_interlaced) - 8; // buffer = 4 for deblock + 3 for 6tap, rounded to 8
-    int height = ((b_end ? frame->i_lines[0] : mb_y*16) >> b_interlaced) + 8;
+    int start = mb_y*16 - 8; // buffer = 4 for deblock + 3 for 6tap, rounded to 8
+    int height = (b_end ? frame->i_lines[0] + 16*h->param.b_interlaced : (mb_y+b_interlaced)*16) + 8;
      int offs = start*stride - 8; // buffer = 3 for 6tap, aligned to 8 for simd
  
      if( mb_y & b_interlaced )
          return;
  
-    for( int y = 0; y <= b_interlaced; y++, offs += frame->i_stride[0] )
-    {
+    if( !b_interlaced || h->mb.b_adaptive_mbaff )
          h->mc.hpel_filter(
              frame->filtered[1] + offs,
              frame->filtered[2] + offs,
@@ -530,6 +529,24 @@ void x264_frame_filter( x264_t *h, x264_frame_t *frame, int mb_y, int b_end )
              frame->plane[0] + offs,
              stride, width + 16, height - start,
              h->scratch_buffer );
+
+    if( b_interlaced )
+    {
+        /* MC must happen between pixels in the same field. */
+        stride = frame->i_stride[0] << 1;
+        start = (mb_y*16 >> 1) - 8;
+        int height_fld = ((b_end ? frame->i_lines[0] : mb_y*16) >> 1) + 8;
+        offs = start*stride - 8;
+        for( int i = 0; i < 2; i++, offs += frame->i_stride[0] )
+        {
+            h->mc.hpel_filter(
+                frame->filtered_fld[1] + offs,
+                frame->filtered_fld[2] + offs,
+                frame->filtered_fld[3] + offs,
+                frame->plane_fld[0] + offs,
+                stride, width + 16, height_fld - start,
+                h->scratch_buffer );
+        }
      }
  
      /* generate integral image:
diff --git a/common/mvpred.c b/common/mvpred.c

index 304bfca5791b1b5e35ee1b54d5bec6ea2dd7fb1c..6d4f608537116ba769d452ad36cd61b90f5a9c7a 100644 (file)
--- a/common/mvpred.c
+++ b/common/mvpred.c
@@ -38,12 +38,33 @@ void x264_mb_predict_mv( x264_t *h, int i_list, int idx, int i_width, int16_t mv
      int     i_refc = h->mb.cache.ref[i_list][i8 - 8 + i_width];
      int16_t *mv_c  = h->mb.cache.mv[i_list][i8 - 8 + i_width];
  
+    // Partitions not yet reached in scan order are unavailable.
      if( (idx&3) >= 2 + (i_width&1) || i_refc == -2 )
      {
          i_refc = h->mb.cache.ref[i_list][i8 - 8 - 1];
          mv_c   = h->mb.cache.mv[i_list][i8 - 8 - 1];
-    }
  
+        if( h->sh.b_mbaff
+            && h->mb.cache.ref[i_list][x264_scan8[0]-1] != -2
+            && h->mb.b_interlaced != h->mb.field[h->mb.i_mb_left_xy[0]] )
+        {
+            if( idx == 2 )
+            {
+                mv_c = h->mb.cache.topright_mv[i_list][0];
+                i_refc = h->mb.cache.topright_ref[i_list][0];
+            }
+            else if( idx == 8 )
+            {
+                mv_c = h->mb.cache.topright_mv[i_list][1];
+                i_refc = h->mb.cache.topright_ref[i_list][1];
+            }
+            else if( idx == 10 )
+            {
+                mv_c = h->mb.cache.topright_mv[i_list][2];
+                i_refc = h->mb.cache.topright_ref[i_list][2];
+            }
+        }
+    }
      if( h->mb.i_partition == D_16x8 )
      {
          if( idx == 0 )
author	Simon Horlick <simonhorlick@gmail.com>
	Tue, 29 Mar 2011 19:25:23 +0000 (20:25 +0100)
committer	Fiona Glaser <fiona@x264.com>
	Thu, 12 May 2011 06:06:07 +0000 (23:06 -0700)
common/common.h		patch \| blob \| history
common/frame.c		patch \| blob \| history
common/frame.h		patch \| blob \| history
common/macroblock.c		patch \| blob \| history
common/mc.c		patch \| blob \| history
common/mvpred.c		patch \| blob \| history