h264dec: add forgotten copying of h->sync
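
For context, a minimal sketch of what the forgotten copy amounts to (paraphrasing the
decode_update_thread_context() hunk below; the helper name here is purely illustrative,
not a function in the tree): when a frame thread inherits decoder state, h->sync has to
be carried over along with the rest of the per-context fields, otherwise the destination
context forgets that a keyframe/recovery point has already been seen.

    #include "h264.h"

    /* Illustrative sketch only, not the real update function. */
    static void copy_sync_state_sketch(H264Context *dst, const H264Context *src)
    {
        dst->last_slice_type = src->last_slice_type;
        dst->sync            = src->sync;   /* the copy this commit adds */
    }
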
diff --git a/libavcodec/h264.c b/libavcodec/h264.c
index 08d66cd2e75d97d9957b4ad37728e40d620949d2..9e2b55426b179e411b661d33bbb92925daec50bb 100644
--- a/libavcodec/h264.c
+++ b/libavcodec/h264.c
@@ -174,20 +174,28 @@ const uint8_t *ff_h264_decode_nal(H264Context *h, const uint8_t *src, int *dst_l
         i-= RS;
     }
 
-    if(i>=length-1){ //no escaped 0
-        *dst_length= length;
-        *consumed= length+1; //+1 for the header
-        return src;
-    }
-
     bufidx = h->nal_unit_type == NAL_DPC ? 1 : 0; // use second escape buffer for inter data
-    av_fast_malloc(&h->rbsp_buffer[bufidx], &h->rbsp_buffer_size[bufidx], length+FF_INPUT_BUFFER_PADDING_SIZE);
+    si=h->rbsp_buffer_size[bufidx];
+    av_fast_malloc(&h->rbsp_buffer[bufidx], &h->rbsp_buffer_size[bufidx], length+FF_INPUT_BUFFER_PADDING_SIZE+MAX_MBPAIR_SIZE);
     dst= h->rbsp_buffer[bufidx];
+    if(si != h->rbsp_buffer_size[bufidx])
+        memset(dst + length, 0, FF_INPUT_BUFFER_PADDING_SIZE+MAX_MBPAIR_SIZE);
 
     if (dst == NULL){
         return NULL;
     }
 
+    if(i>=length-1){ //no escaped 0
+        *dst_length= length;
+        *consumed= length+1; //+1 for the header
+        if(h->s.avctx->flags2 & CODEC_FLAG2_FAST){
+            return src;
+        }else{
+            memcpy(dst, src, length);
+            return dst;
+        }
+    }
+
 //printf("decoding esc\n");
     memcpy(dst, src, i);
     si=di=i;
@@ -942,7 +950,7 @@ static void clone_tables(H264Context *dst, H264Context *src, int i){
     dst->list_counts              = src->list_counts;
 
     dst->s.obmc_scratchpad = NULL;
-    ff_h264_pred_init(&dst->hpc, src->s.codec_id, src->sps.bit_depth_luma);
+    ff_h264_pred_init(&dst->hpc, src->s.codec_id, src->sps.bit_depth_luma, src->sps.chroma_format_idc);
 }
 
 /**
@@ -970,8 +978,8 @@ static av_cold void common_init(H264Context *h){
     s->height = s->avctx->height;
     s->codec_id= s->avctx->codec->id;
 
-    ff_h264dsp_init(&h->h264dsp, 8);
-    ff_h264_pred_init(&h->hpc, s->codec_id, 8);
+    ff_h264dsp_init(&h->h264dsp, 8, 1);
+    ff_h264_pred_init(&h->hpc, s->codec_id, 8, 1);
 
     h->dequant_coeff_pps= -1;
     s->unrestricted_mv=1;
@@ -1138,7 +1146,10 @@ static int decode_update_thread_context(AVCodecContext *dst, const AVCodecContex
         memcpy(&h->s + 1, &h1->s + 1, sizeof(H264Context) - sizeof(MpegEncContext)); //copy all fields after MpegEnc
         memset(h->sps_buffers, 0, sizeof(h->sps_buffers));
         memset(h->pps_buffers, 0, sizeof(h->pps_buffers));
-        ff_h264_alloc_tables(h);
+        if (ff_h264_alloc_tables(h) < 0) {
+            av_log(dst, AV_LOG_ERROR, "Could not allocate memory for h264\n");
+            return AVERROR(ENOMEM);
+        }
         context_init(h);
 
         for(i=0; i<2; i++){
@@ -1190,11 +1201,12 @@ static int decode_update_thread_context(AVCodecContext *dst, const AVCodecContex
     copy_picture_range(h->delayed_pic, h1->delayed_pic, MAX_DELAYED_PIC_COUNT+2, s, s1);
 
     h->last_slice_type = h1->last_slice_type;
+    h->sync            = h1->sync;
 
     if(!s->current_picture_ptr) return 0;
 
     if(!s->dropable) {
-        ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index);
+        err = ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index);
         h->prev_poc_msb     = h->poc_msb;
         h->prev_poc_lsb     = h->poc_lsb;
     }
@@ -1202,7 +1214,7 @@ static int decode_update_thread_context(AVCodecContext *dst, const AVCodecContex
     h->prev_frame_num       = h->frame_num;
     h->outputed_poc         = h->next_outputed_poc;
 
-    return 0;
+    return err;
 }
 
 int ff_h264_frame_start(H264Context *h){
@@ -1376,7 +1388,7 @@ static void decode_postinit(H264Context *h, int setup_finished){
     pics = 0;
     while(h->delayed_pic[pics]) pics++;
 
-    assert(pics <= MAX_DELAYED_PIC_COUNT);
+    av_assert0(pics <= MAX_DELAYED_PIC_COUNT);
 
     h->delayed_pic[pics++] = cur;
     if (cur->f.reference == 0)
@@ -1421,15 +1433,21 @@ static void decode_postinit(H264Context *h, int setup_finished){
         av_log(s->avctx, AV_LOG_DEBUG, "no picture\n");
     }
 
+    if (h->next_output_pic && h->next_output_pic->sync) {
+        h->sync |= 2*!!h->next_output_pic->f.key_frame;
+    }
+
     if (setup_finished)
         ff_thread_finish_setup(s->avctx);
 }
 
-static av_always_inline void backup_mb_border(H264Context *h, uint8_t *src_y, uint8_t *src_cb, uint8_t *src_cr, int linesize, int uvlinesize, int chroma444, int simple){
+static av_always_inline void backup_mb_border(H264Context *h, uint8_t *src_y, uint8_t *src_cb, uint8_t *src_cr, int linesize, int uvlinesize, int simple){
     MpegEncContext * const s = &h->s;
     uint8_t *top_border;
     int top_idx = 1;
     const int pixel_shift = h->pixel_shift;
+    int chroma444 = CHROMA444;
+    int chroma422 = CHROMA422;
 
     src_y  -=   linesize;
     src_cb -= uvlinesize;
@@ -1453,6 +1471,14 @@ static av_always_inline void backup_mb_border(H264Context *h, uint8_t *src_y, ui
                             AV_COPY128(top_border+16, src_cb + 15*uvlinesize);
                             AV_COPY128(top_border+32, src_cr + 15*uvlinesize);
                         }
+                    } else if(chroma422){
+                        if (pixel_shift) {
+                            AV_COPY128(top_border+32, src_cb + 15*uvlinesize);
+                            AV_COPY128(top_border+48, src_cr + 15*uvlinesize);
+                        } else {
+                            AV_COPY64(top_border+16, src_cb +  15*uvlinesize);
+                            AV_COPY64(top_border+24, src_cr +  15*uvlinesize);
+                        }
                     } else {
                         if (pixel_shift) {
                             AV_COPY128(top_border+32, src_cb+7*uvlinesize);
@@ -1488,6 +1514,14 @@ static av_always_inline void backup_mb_border(H264Context *h, uint8_t *src_y, ui
                 AV_COPY128(top_border+16, src_cb + 16*linesize);
                 AV_COPY128(top_border+32, src_cr + 16*linesize);
             }
+        } else if(chroma422) {
+            if (pixel_shift) {
+                AV_COPY128(top_border+32, src_cb+16*uvlinesize);
+                AV_COPY128(top_border+48, src_cr+16*uvlinesize);
+            } else {
+                AV_COPY64(top_border+16, src_cb+16*uvlinesize);
+                AV_COPY64(top_border+24, src_cr+16*uvlinesize);
+            }
         } else {
             if (pixel_shift) {
                 AV_COPY128(top_border+32, src_cb+8*uvlinesize);
@@ -1766,10 +1800,11 @@ static av_always_inline void hl_decode_mb_internal(H264Context *h, int simple, i
     /* is_h264 should always be true if SVQ3 is disabled. */
     const int is_h264 = !CONFIG_SVQ3_DECODER || simple || s->codec_id == CODEC_ID_H264;
     void (*idct_add)(uint8_t *dst, DCTELEM *block, int stride);
+    const int block_h = 16>>s->chroma_y_shift;
 
     dest_y  = s->current_picture.f.data[0] + ((mb_x << pixel_shift) + mb_y * s->linesize  ) * 16;
-    dest_cb = s->current_picture.f.data[1] + ((mb_x << pixel_shift) + mb_y * s->uvlinesize) *  8;
-    dest_cr = s->current_picture.f.data[2] + ((mb_x << pixel_shift) + mb_y * s->uvlinesize) *  8;
+    dest_cb = s->current_picture.f.data[1] + (mb_x << pixel_shift)*8 + mb_y * s->uvlinesize * block_h;
+    dest_cr = s->current_picture.f.data[2] + (mb_x << pixel_shift)*8 + mb_y * s->uvlinesize * block_h;
 
     s->dsp.prefetch(dest_y + (s->mb_x&3)*4*s->linesize + (64 << pixel_shift), s->linesize, 4);
     s->dsp.prefetch(dest_cb + (s->mb_x&7)*s->uvlinesize + (64 << pixel_shift), dest_cr - dest_cb, 2);
@@ -1782,8 +1817,8 @@ static av_always_inline void hl_decode_mb_internal(H264Context *h, int simple, i
         block_offset = &h->block_offset[48];
         if(mb_y&1){ //FIXME move out of this function?
             dest_y -= s->linesize*15;
-            dest_cb-= s->uvlinesize*7;
-            dest_cr-= s->uvlinesize*7;
+            dest_cb-= s->uvlinesize*(block_h-1);
+            dest_cr-= s->uvlinesize*(block_h-1);
         }
         if(FRAME_MBAFF) {
             int list;
@@ -1830,16 +1865,16 @@ static av_always_inline void hl_decode_mb_internal(H264Context *h, int simple, i
                         }
                     }
                 } else {
-                for (i = 0; i < 8; i++) {
-                    uint16_t *tmp_cb = (uint16_t*)(dest_cb + i*uvlinesize);
-                    for (j = 0; j < 8; j++)
-                        tmp_cb[j] = get_bits(&gb, bit_depth);
-                }
-                for (i = 0; i < 8; i++) {
-                    uint16_t *tmp_cr = (uint16_t*)(dest_cr + i*uvlinesize);
-                    for (j = 0; j < 8; j++)
-                        tmp_cr[j] = get_bits(&gb, bit_depth);
-                }
+                    for (i = 0; i < block_h; i++) {
+                        uint16_t *tmp_cb = (uint16_t*)(dest_cb + i*uvlinesize);
+                        for (j = 0; j < 8; j++)
+                            tmp_cb[j] = get_bits(&gb, bit_depth);
+                    }
+                    for (i = 0; i < block_h; i++) {
+                        uint16_t *tmp_cr = (uint16_t*)(dest_cr + i*uvlinesize);
+                        for (j = 0; j < 8; j++)
+                            tmp_cr[j] = get_bits(&gb, bit_depth);
+                    }
                 }
             }
         } else {
@@ -1853,10 +1888,10 @@ static av_always_inline void hl_decode_mb_internal(H264Context *h, int simple, i
                         memset(dest_cr+ i*uvlinesize, 1 << (bit_depth - 1), 8);
                     }
                 } else {
-                for (i=0; i<8; i++) {
-                    memcpy(dest_cb+ i*uvlinesize, h->mb + 128 + i*4,  8);
-                    memcpy(dest_cr+ i*uvlinesize, h->mb + 160 + i*4,  8);
-                }
+                    for (i=0; i<block_h; i++) {
+                        memcpy(dest_cb+ i*uvlinesize, h->mb + 128 + i*4,  8);
+                        memcpy(dest_cr+ i*uvlinesize, h->mb + 160 + i*4,  8);
+                    }
                 }
             }
         }
@@ -1901,10 +1936,18 @@ static av_always_inline void hl_decode_mb_internal(H264Context *h, int simple, i
                 }
             }else{
                 if(is_h264){
+                    int qp[2];
+                    if (CHROMA422) {
+                        qp[0] = h->chroma_qp[0]+3;
+                        qp[1] = h->chroma_qp[1]+3;
+                    } else {
+                        qp[0] = h->chroma_qp[0];
+                        qp[1] = h->chroma_qp[1];
+                    }
                     if(h->non_zero_count_cache[ scan8[CHROMA_DC_BLOCK_INDEX+0] ])
-                        h->h264dsp.h264_chroma_dc_dequant_idct(h->mb + (16*16*1 << pixel_shift), h->dequant4_coeff[IS_INTRA(mb_type) ? 1:4][h->chroma_qp[0]][0]);
+                        h->h264dsp.h264_chroma_dc_dequant_idct(h->mb + (16*16*1 << pixel_shift), h->dequant4_coeff[IS_INTRA(mb_type) ? 1:4][qp[0]][0]);
                     if(h->non_zero_count_cache[ scan8[CHROMA_DC_BLOCK_INDEX+1] ])
-                        h->h264dsp.h264_chroma_dc_dequant_idct(h->mb + (16*16*2 << pixel_shift), h->dequant4_coeff[IS_INTRA(mb_type) ? 2:5][h->chroma_qp[1]][0]);
+                        h->h264dsp.h264_chroma_dc_dequant_idct(h->mb + (16*16*2 << pixel_shift), h->dequant4_coeff[IS_INTRA(mb_type) ? 2:5][qp[1]][0]);
                     h->h264dsp.h264_idct_add8(dest, block_offset,
                                               h->mb, uvlinesize,
                                               h->non_zero_count_cache);
@@ -2174,17 +2217,17 @@ static void implicit_weight_table(H264Context *h, int field){
     for(ref0=ref_start; ref0 < ref_count0; ref0++){
         int poc0 = h->ref_list[0][ref0].poc;
         for(ref1=ref_start; ref1 < ref_count1; ref1++){
-            int w= 32;
-            if (!h->ref_list[0][ref0].long_ref && !h->ref_list[1][ref1].long_ref){
-            int poc1 = h->ref_list[1][ref1].poc;
-            int td = av_clip(poc1 - poc0, -128, 127);
-            if(td){
-                int tb = av_clip(cur_poc - poc0, -128, 127);
-                int tx = (16384 + (FFABS(td) >> 1)) / td;
-                int dist_scale_factor = (tb*tx + 32) >> 8;
-                if(dist_scale_factor >= -64 && dist_scale_factor <= 128)
-                    w = 64 - dist_scale_factor;
-            }
+            int w = 32;
+            if (!h->ref_list[0][ref0].long_ref && !h->ref_list[1][ref1].long_ref) {
+                int poc1 = h->ref_list[1][ref1].poc;
+                int td = av_clip(poc1 - poc0, -128, 127);
+                if(td){
+                    int tb = av_clip(cur_poc - poc0, -128, 127);
+                    int tx = (16384 + (FFABS(td) >> 1)) / td;
+                    int dist_scale_factor = (tb*tx + 32) >> 8;
+                    if(dist_scale_factor >= -64 && dist_scale_factor <= 128)
+                        w = 64 - dist_scale_factor;
+                }
             }
             if(field<0){
                 h->implicit_weight[ref0][ref1][0]=
@@ -2211,7 +2254,7 @@ static void idr(H264Context *h){
 static void flush_dpb(AVCodecContext *avctx){
     H264Context *h= avctx->priv_data;
     int i;
-    for(i=0; i<MAX_DELAYED_PIC_COUNT; i++) {
+    for(i=0; i<=MAX_DELAYED_PIC_COUNT; i++) {
         if(h->delayed_pic[i])
             h->delayed_pic[i]->f.reference = 0;
         h->delayed_pic[i]= NULL;
@@ -2224,6 +2267,7 @@ static void flush_dpb(AVCodecContext *avctx){
     h->s.first_field= 0;
     ff_h264_reset_sei(h);
     ff_mpeg_flush(avctx);
+    h->sync= 0;
 }
 
 static int init_poc(H264Context *h){
@@ -2340,9 +2384,10 @@ static void init_scan_tables(H264Context *h){
     }
 }
 
-static void field_end(H264Context *h, int in_setup){
+static int field_end(H264Context *h, int in_setup){
     MpegEncContext * const s = &h->s;
     AVCodecContext * const avctx= s->avctx;
+    int err = 0;
     s->mb_y= 0;
 
     if (!in_setup && !s->dropable)
@@ -2354,7 +2399,7 @@ static void field_end(H264Context *h, int in_setup){
 
     if(in_setup || !(avctx->active_thread_type&FF_THREAD_FRAME)){
         if(!s->dropable) {
-            ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index);
+            err = ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index);
             h->prev_poc_msb= h->poc_msb;
             h->prev_poc_lsb= h->poc_lsb;
         }
@@ -2389,6 +2434,8 @@ static void field_end(H264Context *h, int in_setup){
     MPV_frame_end(s);
 
     h->current_slice=0;
+
+    return err;
 }
 
 /**
@@ -2539,11 +2586,13 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
 
     h->b_stride=  s->mb_width*4;
 
+    s->chroma_y_shift = h->sps.chroma_format_idc <= 1; // 400 uses yuv420p
+
     s->width = 16*s->mb_width - (2>>CHROMA444)*FFMIN(h->sps.crop_right, (8<<CHROMA444)-1);
     if(h->sps.frame_mbs_only_flag)
-        s->height= 16*s->mb_height - (2>>CHROMA444)*FFMIN(h->sps.crop_bottom, (8<<CHROMA444)-1);
+        s->height= 16*s->mb_height - (1<<s->chroma_y_shift)*FFMIN(h->sps.crop_bottom, (16>>s->chroma_y_shift)-1);
     else
-        s->height= 16*s->mb_height - (4>>CHROMA444)*FFMIN(h->sps.crop_bottom, (8<<CHROMA444)-1);
+        s->height= 16*s->mb_height - (2<<s->chroma_y_shift)*FFMIN(h->sps.crop_bottom, (16>>s->chroma_y_shift)-1);
 
     if (s->context_initialized
         && (   s->width != s->avctx->width || s->height != s->avctx->height
@@ -2566,9 +2615,6 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
         s->avctx->sample_aspect_ratio= h->sps.sar;
         av_assert0(s->avctx->sample_aspect_ratio.den);
 
-        h->s.avctx->coded_width = 16*s->mb_width;
-        h->s.avctx->coded_height = 16*s->mb_height;
-
         if(h->sps.video_signal_type_present_flag){
             s->avctx->color_range = h->sps.full_range ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
             if(h->sps.colour_description_present_flag){
@@ -2588,14 +2634,24 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
 
         switch (h->sps.bit_depth_luma) {
             case 9 :
-                s->avctx->pix_fmt = CHROMA444 ? PIX_FMT_YUV444P9 : PIX_FMT_YUV420P9;
+                if (CHROMA444)
+                    s->avctx->pix_fmt = PIX_FMT_YUV444P9;
+                else
+                    s->avctx->pix_fmt = PIX_FMT_YUV420P9;
                 break;
             case 10 :
-                s->avctx->pix_fmt = CHROMA444 ? PIX_FMT_YUV444P10 : PIX_FMT_YUV420P10;
+                if (CHROMA444)
+                    s->avctx->pix_fmt = PIX_FMT_YUV444P10;
+                else if (CHROMA422)
+                    s->avctx->pix_fmt = PIX_FMT_YUV422P10;
+                else
+                    s->avctx->pix_fmt = PIX_FMT_YUV420P10;
                 break;
             default:
                 if (CHROMA444){
                     s->avctx->pix_fmt = s->avctx->color_range == AVCOL_RANGE_JPEG ? PIX_FMT_YUVJ444P : PIX_FMT_YUV444P;
+                }else if (CHROMA422) {
+                    s->avctx->pix_fmt = s->avctx->color_range == AVCOL_RANGE_JPEG ? PIX_FMT_YUVJ422P : PIX_FMT_YUV422P;
                 }else{
                     s->avctx->pix_fmt = s->avctx->get_format(s->avctx,
                                                              s->avctx->codec->pix_fmts ?
@@ -2616,7 +2672,10 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
         h->prev_interlaced_frame = 1;
 
         init_scan_tables(h);
-        ff_h264_alloc_tables(h);
+        if (ff_h264_alloc_tables(h) < 0) {
+            av_log(h->s.avctx, AV_LOG_ERROR, "Could not allocate memory for h264\n");
+            return AVERROR(ENOMEM);
+        }
 
         if (!HAVE_THREADS || !(s->avctx->active_thread_type&FF_THREAD_SLICE)) {
             if (context_init(h) < 0) {
@@ -2690,7 +2749,9 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
             ff_thread_report_progress((AVFrame*)s->current_picture_ptr, INT_MAX, 0);
             ff_thread_report_progress((AVFrame*)s->current_picture_ptr, INT_MAX, 1);
             ff_generate_sliding_window_mmcos(h);
-            ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index);
+            if (ff_h264_execute_ref_pic_marking(h, h->mmco, h->mmco_index) < 0 &&
+                s->avctx->error_recognition >= FF_ER_EXPLODE)
+                return AVERROR_INVALIDDATA;
             /* Error concealment: if a ref is missing, copy the previous ref in its place.
              * FIXME: avoiding a memcpy would be nice, but ref handling makes many assumptions
              * about there being no actual duplicates.
@@ -2864,8 +2925,9 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
         }
     }
 
-    if(h->nal_ref_idc)
-        ff_h264_decode_ref_pic_marking(h0, &s->gb);
+    if(h->nal_ref_idc && ff_h264_decode_ref_pic_marking(h0, &s->gb) < 0 &&
+       s->avctx->error_recognition >= FF_ER_EXPLODE)
+        return AVERROR_INVALIDDATA;
 
     if(FRAME_MBAFF){
         ff_h264_fill_mbaff_ref_list(h);
@@ -2964,7 +3026,13 @@ static int decode_slice_header(H264Context *h, H264Context *h0){
 
     h0->last_slice_type = slice_type;
     h->slice_num = ++h0->current_slice;
-    if(h->slice_num >= MAX_SLICES){
+
+    if(h->slice_num)
+        h0->slice_row[(h->slice_num-1)&(MAX_SLICES-1)]= s->resync_mb_y;
+    if (   h0->slice_row[h->slice_num&(MAX_SLICES-1)] + 3 >= s->resync_mb_y
+        && h0->slice_row[h->slice_num&(MAX_SLICES-1)] <= s->resync_mb_y
+        && h->slice_num >= MAX_SLICES) {
+        //in case of ASO this check needs to be updated depending on how we decide to assign slice numbers in this case
         av_log(s->avctx, AV_LOG_WARNING, "Possibly too many slices (%d >= %d), increase MAX_SLICES and recompile if there are artifacts\n", h->slice_num, MAX_SLICES);
     }
 
@@ -3251,6 +3319,7 @@ static void loop_filter(H264Context *h, int start_x, int end_x){
     const int end_mb_y= s->mb_y + FRAME_MBAFF;
     const int old_slice_type= h->slice_type;
     const int pixel_shift = h->pixel_shift;
+    const int block_h = 16>>s->chroma_y_shift;
 
     if(h->deblocking_filter) {
         for(mb_x= start_x; mb_x<end_x; mb_x++){
@@ -3267,8 +3336,8 @@ static void loop_filter(H264Context *h, int start_x, int end_x){
                 s->mb_x= mb_x;
                 s->mb_y= mb_y;
                 dest_y  = s->current_picture.f.data[0] + ((mb_x << pixel_shift) + mb_y * s->linesize  ) * 16;
-                dest_cb = s->current_picture.f.data[1] + ((mb_x << pixel_shift) + mb_y * s->uvlinesize) * (8 << CHROMA444);
-                dest_cr = s->current_picture.f.data[2] + ((mb_x << pixel_shift) + mb_y * s->uvlinesize) * (8 << CHROMA444);
+                dest_cb = s->current_picture.f.data[1] + (mb_x << pixel_shift)*(8<<CHROMA444) + mb_y * s->uvlinesize * block_h;
+                dest_cr = s->current_picture.f.data[2] + (mb_x << pixel_shift)*(8<<CHROMA444) + mb_y * s->uvlinesize * block_h;
                     //FIXME simplify above
 
                 if (MB_FIELD) {
@@ -3276,14 +3345,14 @@ static void loop_filter(H264Context *h, int start_x, int end_x){
                     uvlinesize = h->mb_uvlinesize = s->uvlinesize * 2;
                     if(mb_y&1){ //FIXME move out of this function?
                         dest_y -= s->linesize*15;
-                        dest_cb-= s->uvlinesize*((8 << CHROMA444)-1);
-                        dest_cr-= s->uvlinesize*((8 << CHROMA444)-1);
+                        dest_cb-= s->uvlinesize*(block_h-1);
+                        dest_cr-= s->uvlinesize*(block_h-1);
                     }
                 } else {
                     linesize   = h->mb_linesize   = s->linesize;
                     uvlinesize = h->mb_uvlinesize = s->uvlinesize;
                 }
-                backup_mb_border(h, dest_y, dest_cb, dest_cr, linesize, uvlinesize, CHROMA444, 0);
+                backup_mb_border(h, dest_y, dest_cb, dest_cr, linesize, uvlinesize, 0);
                 if(fill_filter_caches(h, mb_type))
                     continue;
                 h->chroma_qp[0] = get_chroma_qp(h, 0, s->current_picture.f.qscale_table[mb_xy]);
@@ -3490,18 +3559,16 @@ static int decode_slice(struct AVCodecContext *avctx, void *arg){
  * @param h h264 master context
  * @param context_count number of contexts to execute
  */
-static void execute_decode_slices(H264Context *h, int context_count){
+static int execute_decode_slices(H264Context *h, int context_count){
     MpegEncContext * const s = &h->s;
     AVCodecContext * const avctx= s->avctx;
     H264Context *hx;
     int i;
 
-    if (s->avctx->hwaccel)
-        return;
-    if(s->avctx->codec->capabilities&CODEC_CAP_HWACCEL_VDPAU)
-        return;
+    if (s->avctx->hwaccel || s->avctx->codec->capabilities&CODEC_CAP_HWACCEL_VDPAU)
+        return 0;
     if(context_count == 1) {
-        decode_slice(avctx, &h);
+        return decode_slice(avctx, &h);
     } else {
         for(i = 1; i < context_count; i++) {
             hx = h->thread_context[i];
@@ -3522,6 +3589,8 @@ static void execute_decode_slices(H264Context *h, int context_count){
         for(i = 1; i < context_count; i++)
             h->s.error_count += h->thread_context[i]->s.error_count;
     }
+
+    return 0;
 }
 
 
@@ -3593,7 +3662,7 @@ static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size){
             s->workaround_bugs |= FF_BUG_TRUNCATED;
 
         if(!(s->workaround_bugs & FF_BUG_TRUNCATED)){
-        while(ptr[dst_length - 1] == 0 && dst_length > 0)
+        while(dst_length > 0 && ptr[dst_length - 1] == 0)
             dst_length--;
         }
         bit_length= !dst_length ? 0 : (8*dst_length - ff_h264_decode_rbsp_trailing(h, ptr + dst_length - 1));
@@ -3648,6 +3717,9 @@ static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size){
             s->current_picture_ptr->f.key_frame |=
                     (hx->nal_unit_type == NAL_IDR_SLICE) ||
                     (h->sei_recovery_frame_cnt >= 0);
+            h->sync |= !!s->current_picture_ptr->f.key_frame;
+            h->sync |= 3*!!(s->flags2 & CODEC_FLAG2_SHOW_ALL);
+            s->current_picture_ptr->sync = h->sync;
 
             if (h->current_slice == 1) {
                 if(!(s->flags2 & CODEC_FLAG2_CHUNKS)) {
@@ -3719,13 +3791,15 @@ static int decode_nal_units(H264Context *h, const uint8_t *buf, int buf_size){
             if(avctx->has_b_frames < 2)
                 avctx->has_b_frames= !s->low_delay;
 
-            if (avctx->bits_per_raw_sample != h->sps.bit_depth_luma) {
+            if (avctx->bits_per_raw_sample != h->sps.bit_depth_luma ||
+                h->cur_chroma_format_idc != h->sps.chroma_format_idc) {
                 if (h->sps.bit_depth_luma >= 8 && h->sps.bit_depth_luma <= 10) {
                     avctx->bits_per_raw_sample = h->sps.bit_depth_luma;
+                    h->cur_chroma_format_idc = h->sps.chroma_format_idc;
                     h->pixel_shift = h->sps.bit_depth_luma > 8;
 
-                    ff_h264dsp_init(&h->h264dsp, h->sps.bit_depth_luma);
-                    ff_h264_pred_init(&h->hpc, s->codec_id, h->sps.bit_depth_luma);
+                    ff_h264dsp_init(&h->h264dsp, h->sps.bit_depth_luma, h->sps.chroma_format_idc);
+                    ff_h264_pred_init(&h->hpc, s->codec_id, h->sps.bit_depth_luma, h->sps.chroma_format_idc);
                     s->dsp.dct_bits = h->sps.bit_depth_luma > 8 ? 32 : 16;
                     dsputil_init(&s->dsp, s->avctx);
                 } else {
@@ -3849,13 +3923,12 @@ static int decode_frame(AVCodecContext *avctx,
 
         field_end(h, 0);
 
-        if (!h->next_output_pic) {
-            /* Wait for second field. */
-            *data_size = 0;
-
-        } else {
-            *data_size = sizeof(AVFrame);
-            *pict = *(AVFrame*)h->next_output_pic;
+        *data_size = 0; /* Wait for second field. */
+        if (h->next_output_pic && h->next_output_pic->sync) {
+            if(h->sync>1 || h->next_output_pic->f.pict_type != AV_PICTURE_TYPE_B){
+                *data_size = sizeof(AVFrame);
+                *pict = *(AVFrame*)h->next_output_pic;
+            }
         }
     }