mini-fix for compatibility with other compilers by (Hauke Duden <H.NS.Duden at gmx...

[ffmpeg] / libavcodec / mpegvideo.c
diff --git a/libavcodec/mpegvideo.c b/libavcodec/mpegvideo.c

index b65b65f3e109afd1720602ce63fe5e4873a5c713..e28d9b309bfc748e922a92ba873ac4cc4d1cead6 100644 (file)
--- a/libavcodec/mpegvideo.c
+++ b/libavcodec/mpegvideo.c
@@ -25,12 +25,11 @@
   * The simplest mpeg encoder (well, it was the simplest!).
   */ 
   
-#include <limits.h>
-#include <math.h> //for PI
  #include "avcodec.h"
  #include "dsputil.h"
  #include "mpegvideo.h"
  #include "faandct.h"
+#include <limits.h>
  
  #ifdef USE_FASTMEMCPY
  #include "fastmemcpy.h"
@@ -54,6 +53,10 @@ static void dct_unquantize_h263_intra_c(MpegEncContext *s,
                                    DCTELEM *block, int n, int qscale);
  static void dct_unquantize_h263_inter_c(MpegEncContext *s, 
                                    DCTELEM *block, int n, int qscale);
+static void dct_unquantize_h261_intra_c(MpegEncContext *s, 
+                                  DCTELEM *block, int n, int qscale);
+static void dct_unquantize_h261_inter_c(MpegEncContext *s, 
+                                  DCTELEM *block, int n, int qscale);
  static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w);
  #ifdef CONFIG_ENCODERS
  static int dct_quantize_c(MpegEncContext *s, DCTELEM *block, int n, int qscale, int *overflow);
@@ -216,6 +219,8 @@ int DCT_common_init(MpegEncContext *s)
  {
      s->dct_unquantize_h263_intra = dct_unquantize_h263_intra_c;
      s->dct_unquantize_h263_inter = dct_unquantize_h263_inter_c;
+    s->dct_unquantize_h261_intra = dct_unquantize_h261_intra_c;
+    s->dct_unquantize_h261_inter = dct_unquantize_h261_inter_c;
      s->dct_unquantize_mpeg1_intra = dct_unquantize_mpeg1_intra_c;
      s->dct_unquantize_mpeg1_inter = dct_unquantize_mpeg1_inter_c;
      s->dct_unquantize_mpeg2_intra = dct_unquantize_mpeg2_intra_c;
@@ -267,8 +272,6 @@ int DCT_common_init(MpegEncContext *s)
      ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
      ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
  
-    s->picture_structure= PICT_FRAME;
-    
      return 0;
  }
  
@@ -277,7 +280,9 @@ static void copy_picture(Picture *dst, Picture *src){
      dst->type= FF_BUFFER_TYPE_COPY;
  }
  
-static void copy_picture_attributes(AVFrame *dst, AVFrame *src){
+static void copy_picture_attributes(MpegEncContext *s, AVFrame *dst, AVFrame *src){
+    int i;
+
      dst->pict_type              = src->pict_type;
      dst->quality                = src->quality;
      dst->coded_picture_number   = src->coded_picture_number;
@@ -286,6 +291,32 @@ static void copy_picture_attributes(AVFrame *dst, AVFrame *src){
      dst->pts                    = src->pts;
      dst->interlaced_frame       = src->interlaced_frame;
      dst->top_field_first        = src->top_field_first;
+
+    if(s->avctx->me_threshold){
+        if(!src->motion_val[0])
+            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.motion_val not set!\n");
+        if(!src->mb_type)
+            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.mb_type not set!\n");
+        if(!src->ref_index[0])
+            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.ref_index not set!\n");
+        if(src->motion_subsample_log2 != dst->motion_subsample_log2)
+            av_log(s->avctx, AV_LOG_ERROR, "AVFrame.motion_subsample_log2 doesnt match! (%d!=%d)\n",
+            src->motion_subsample_log2, dst->motion_subsample_log2);
+
+        memcpy(dst->mb_type, src->mb_type, s->mb_stride * s->mb_height * sizeof(dst->mb_type[0]));
+        
+        for(i=0; i<2; i++){
+            int stride= ((16*s->mb_width )>>src->motion_subsample_log2) + 1;
+            int height= ((16*s->mb_height)>>src->motion_subsample_log2);
+
+            if(src->motion_val[i] && src->motion_val[i] != dst->motion_val[i]){
+                memcpy(dst->motion_val[i], src->motion_val[i], 2*stride*height*sizeof(int16_t));
+            }
+            if(src->ref_index[i] && src->ref_index[i] != dst->ref_index[i]){
+                memcpy(dst->ref_index[i], src->ref_index[i], s->b8_stride*2*s->mb_height*sizeof(int8_t));
+            }
+        }
+    }
  }
  
  /**
@@ -342,18 +373,22 @@ static int alloc_picture(MpegEncContext *s, Picture *pic, int shared){
          pic->mb_type= pic->mb_type_base + s->mb_stride+1;
          if(s->out_format == FMT_H264){
              for(i=0; i<2; i++){
-                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b4_array_size+1)  * sizeof(int16_t))
-                pic->motion_val[i]= pic->motion_val_base[i]+1;
-                CHECKED_ALLOCZ(pic->ref_index[i] , b8_array_size * sizeof(uint8_t))
+                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b4_array_size+2)  * sizeof(int16_t))
+                pic->motion_val[i]= pic->motion_val_base[i]+2;
+                CHECKED_ALLOCZ(pic->ref_index[i], b8_array_size * sizeof(uint8_t))
              }
              pic->motion_subsample_log2= 2;
          }else if(s->out_format == FMT_H263 || s->encoding || (s->avctx->debug&FF_DEBUG_MV) || (s->avctx->debug_mv)){
              for(i=0; i<2; i++){
-                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b8_array_size+1) * sizeof(int16_t)*2) //FIXME
-                pic->motion_val[i]= pic->motion_val_base[i]+1;
+                CHECKED_ALLOCZ(pic->motion_val_base[i], 2 * (b8_array_size+2) * sizeof(int16_t))
+                pic->motion_val[i]= pic->motion_val_base[i]+2;
+                CHECKED_ALLOCZ(pic->ref_index[i], b8_array_size * sizeof(uint8_t))
              }
              pic->motion_subsample_log2= 3;
          }
+        if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
+            CHECKED_ALLOCZ(pic->dct_coeff, 64 * mb_array_size * sizeof(DCTELEM)*6)
+        }
          pic->qstride= s->mb_stride;
          CHECKED_ALLOCZ(pic->pan_scan , 1 * sizeof(AVPanScan))
      }
@@ -385,6 +420,7 @@ static void free_picture(MpegEncContext *s, Picture *pic){
      av_freep(&pic->mbskip_table);
      av_freep(&pic->qscale_table);
      av_freep(&pic->mb_type_base);
+    av_freep(&pic->dct_coeff);
      av_freep(&pic->pan_scan);
      pic->mb_type= NULL;
      for(i=0; i<2; i++){
@@ -404,11 +440,12 @@ static void free_picture(MpegEncContext *s, Picture *pic){
  static int init_duplicate_context(MpegEncContext *s, MpegEncContext *base){
      int i;
  
+    // edge emu needs blocksize + filter length - 1 (=17x17 for halfpel / 21x21 for h264) 
      CHECKED_ALLOCZ(s->allocated_edge_emu_buffer, (s->width+64)*2*17*2); //(width + edge + align)*interlaced*MBsize*tolerance
      s->edge_emu_buffer= s->allocated_edge_emu_buffer + (s->width+64)*2*17;
  
       //FIXME should be linesize instead of s->width*2 but that isnt known before get_buffer()
-    CHECKED_ALLOCZ(s->me.scratchpad,  s->width*2*16*2*sizeof(uint8_t)) 
+    CHECKED_ALLOCZ(s->me.scratchpad,  (s->width+64)*2*16*2*sizeof(uint8_t)) 
      s->rd_scratchpad=   s->me.scratchpad;
      s->b_scratchpad=    s->me.scratchpad;
      s->obmc_scratchpad= s->me.scratchpad + 16;
@@ -419,7 +456,7 @@ static int init_duplicate_context(MpegEncContext *s, MpegEncContext *base){
              CHECKED_ALLOCZ(s->dct_error_sum, 2 * 64 * sizeof(int))
          }
      }   
-    CHECKED_ALLOCZ(s->blocks, 64*6*2 * sizeof(DCTELEM))
+    CHECKED_ALLOCZ(s->blocks, 64*12*2 * sizeof(DCTELEM))
      s->block= s->blocks[0];
  
      for(i=0;i<12;i++){
@@ -463,16 +500,22 @@ static void backup_duplicate_context(MpegEncContext *bak, MpegEncContext *src){
      COPY(me.map_generation);
      COPY(pb);
      COPY(dct_error_sum);
+    COPY(dct_count[0]);
+    COPY(dct_count[1]);
  #undef COPY
  }
  
-static void update_duplicate_context(MpegEncContext *dst, MpegEncContext *src){
+void ff_update_duplicate_context(MpegEncContext *dst, MpegEncContext *src){
      MpegEncContext bak;
+    int i;
      //FIXME copy only needed parts
  //START_TIMER
      backup_duplicate_context(&bak, dst);
      memcpy(dst, src, sizeof(MpegEncContext));
      backup_duplicate_context(dst, &bak);
+    for(i=0;i<12;i++){
+        dst->pblocks[i] = (short *)(&dst->block[i]);
+    }
  //STOP_TIMER("update_duplicate_context") //about 10k cycles / 0.01 sec for 1000frames on 1ghz with 2 threads
  }
  
@@ -493,11 +536,77 @@ static void update_duplicate_context_after_me(MpegEncContext *dst, MpegEncContex
  #undef COPY
  }
  
-/* init common structure for both encoder and decoder */
+/**
+ * Sets the given MpegEncContext to the defaults shared by encoding and decoding: both DC scale tables, the chroma qscale table, the progressive / picture-structure fields, the picture counters and f_code / b_code.
+ * Every field is assigned a constant, so the changed fields will not depend upon the prior state of the MpegEncContext.
+ */
+static void MPV_common_defaults(MpegEncContext *s){
+    s->y_dc_scale_table=
+    s->c_dc_scale_table= ff_mpeg1_dc_scale_table; // chained assignment: the y and c tables both point at the same table
+    s->chroma_qscale_table= ff_default_chroma_qscale_table;
+    s->progressive_frame= 1;
+    s->progressive_sequence= 1;
+    s->picture_structure= PICT_FRAME;
+    /* all picture counters restart from zero */
+    s->coded_picture_number = 0;
+    s->picture_number = 0;
+    s->input_picture_number = 0;
+
+    s->picture_in_gop_number = 0;
+    /* "motion detector init" (wording of the comment that accompanied these two assignments in MPV_encode_init) */
+    s->f_code = 1;
+    s->b_code = 1;
+}
+
+/**
+ * Sets the given MpegEncContext to defaults for decoding; at present this only applies MPV_common_defaults(), no decoder-specific field is set here.
+ * The changed fields will not depend upon the prior state of the MpegEncContext.
+ */
+void MPV_decode_defaults(MpegEncContext *s){
+    MPV_common_defaults(s);
+}
+
+/**
+ * Sets the given MpegEncContext to defaults for encoding: applies MPV_common_defaults(), fills the shared default_mv_penalty / default_fcode_tab tables on the first call only, and points s->me.mv_penalty and s->fcode_tab at them.
+ * The changed fields will not depend upon the prior state of the MpegEncContext.
+ */
+
+#ifdef CONFIG_ENCODERS
+static void MPV_encode_defaults(MpegEncContext *s){
+    static int done=0; // one-time guard for the table setup below; plain static int, no locking visible here
+    
+    MPV_common_defaults(s);
+    
+    if(!done){
+        int i;
+        done=1;
+        /* NOTE(review): the av_mallocz() result is passed to memset() without a NULL check -- confirm allocation failure is handled elsewhere */
+        default_mv_penalty= av_mallocz( sizeof(uint8_t)*(MAX_FCODE+1)*(2*MAX_MV+1) );
+        memset(default_mv_penalty, 0, sizeof(uint8_t)*(MAX_FCODE+1)*(2*MAX_MV+1)); // presumably redundant if av_mallocz() already zero-fills -- TODO confirm
+        memset(default_fcode_tab , 0, sizeof(uint8_t)*(2*MAX_MV+1));
+        /* set the 32 entries at indices MAX_MV-16 .. MAX_MV+15 to 1; the rest stay 0 */
+        for(i=-16; i<16; i++){
+            default_fcode_tab[i + MAX_MV]= 1;
+        }
+    }
+    s->me.mv_penalty= default_mv_penalty; // every call assigns the same shared default tables
+    s->fcode_tab= default_fcode_tab;
+}
+#endif //CONFIG_ENCODERS
+
+/** 
+ * init common structure for both encoder and decoder.
+ * this assumes that some variables like width/height are already set
+ */
  int MPV_common_init(MpegEncContext *s)
  {
      int y_size, c_size, yc_size, i, mb_array_size, mv_table_size, x, y;
  
+    if(s->avctx->thread_count > MAX_THREADS || (16*s->avctx->thread_count > s->height && s->height)){
+        av_log(s->avctx, AV_LOG_ERROR, "too many threads\n");
+        return -1;
+    }
+
      dsputil_init(&s->dsp, s->avctx);
      DCT_common_init(s);
  
@@ -521,22 +630,14 @@ int MPV_common_init(MpegEncContext *s)
      s->block_wrap[0]=
      s->block_wrap[1]=
      s->block_wrap[2]=
-    s->block_wrap[3]= s->mb_width*2 + 2;
+    s->block_wrap[3]= s->b8_stride;
      s->block_wrap[4]=
-    s->block_wrap[5]= s->mb_width + 2;
-
-    s->y_dc_scale_table=
-    s->c_dc_scale_table= ff_mpeg1_dc_scale_table;
-    s->chroma_qscale_table= ff_default_chroma_qscale_table;
-    if (!s->encoding)
-        s->progressive_sequence= 1;
-    s->progressive_frame= 1;
-    s->coded_picture_number = 0;
-
-    y_size = (2 * s->mb_width + 2) * (2 * s->mb_height + 2);
-    c_size = (s->mb_width + 2) * (s->mb_height + 2);
+    s->block_wrap[5]= s->mb_stride;
+ 
+    y_size = s->b8_stride * (2 * s->mb_height + 1);
+    c_size = s->mb_stride * (s->mb_height + 1);
      yc_size = y_size + 2 * c_size;
-
+    
      /* convert fourcc to upper case */
      s->avctx->codec_tag=   toupper( s->avctx->codec_tag     &0xFF)          
                          + (toupper((s->avctx->codec_tag>>8 )&0xFF)<<8 )
@@ -616,12 +717,14 @@ int MPV_common_init(MpegEncContext *s)
      }
      if (s->out_format == FMT_H263) {
          /* ac values */
-        CHECKED_ALLOCZ(s->ac_val[0], yc_size * sizeof(int16_t) * 16);
-        s->ac_val[1] = s->ac_val[0] + y_size;
+        CHECKED_ALLOCZ(s->ac_val_base, yc_size * sizeof(int16_t) * 16);
+        s->ac_val[0] = s->ac_val_base + s->b8_stride + 1;
+        s->ac_val[1] = s->ac_val_base + y_size + s->mb_stride + 1;
          s->ac_val[2] = s->ac_val[1] + c_size;
          
          /* cbp values */
-        CHECKED_ALLOCZ(s->coded_block, y_size);
+        CHECKED_ALLOCZ(s->coded_block_base, y_size);
+        s->coded_block= s->coded_block_base + s->b8_stride + 1;
          
          /* divx501 bitstream reorder buffer */
          CHECKED_ALLOCZ(s->bitstream_buffer, BITSTREAM_BUFFER_SIZE);
@@ -634,20 +737,18 @@ int MPV_common_init(MpegEncContext *s)
      if (s->h263_pred || s->h263_plus || !s->encoding) {
          /* dc values */
          //MN: we need these for error resilience of intra-frames
-        CHECKED_ALLOCZ(s->dc_val[0], yc_size * sizeof(int16_t));
-        s->dc_val[1] = s->dc_val[0] + y_size;
+        CHECKED_ALLOCZ(s->dc_val_base, yc_size * sizeof(int16_t));
+        s->dc_val[0] = s->dc_val_base + s->b8_stride + 1;
+        s->dc_val[1] = s->dc_val_base + y_size + s->mb_stride + 1;
          s->dc_val[2] = s->dc_val[1] + c_size;
          for(i=0;i<yc_size;i++)
-            s->dc_val[0][i] = 1024;
+            s->dc_val_base[i] = 1024;
      }
  
      /* which mb is a intra block */
      CHECKED_ALLOCZ(s->mbintra_table, mb_array_size);
      memset(s->mbintra_table, 1, mb_array_size);
      
-    /* default structure is frame */
-    s->picture_structure = PICT_FRAME;
-    
      /* init macroblock skip table */
      CHECKED_ALLOCZ(s->mbskip_table, mb_array_size+2);
      //Note the +1 is for a quicker mpeg4 slice_end detection
@@ -722,9 +823,9 @@ void MPV_common_end(MpegEncContext *s)
          av_freep(&s->p_field_select_table[i]);
      }
      
-    av_freep(&s->dc_val[0]);
-    av_freep(&s->ac_val[0]);
-    av_freep(&s->coded_block);
+    av_freep(&s->dc_val_base);
+    av_freep(&s->ac_val_base);
+    av_freep(&s->coded_block_base);
      av_freep(&s->mbintra_table);
      av_freep(&s->cbp_table);
      av_freep(&s->pred_dir_table);
@@ -743,7 +844,6 @@ void MPV_common_end(MpegEncContext *s)
      av_freep(&s->q_inter_matrix16);
      av_freep(&s->input_picture);
      av_freep(&s->reordered_input_picture);
-    av_freep(&s->dct_error_sum);
      av_freep(&s->dct_offset);
  
      if(s->picture){
@@ -752,14 +852,13 @@ void MPV_common_end(MpegEncContext *s)
          }
      }
      av_freep(&s->picture);
-    avcodec_default_free_buffers(s->avctx);
      s->context_initialized = 0;
      s->last_picture_ptr=
      s->next_picture_ptr=
      s->current_picture_ptr= NULL;
+
      for(i=0; i<3; i++)
-        if (s->visualization_buffer[i])
-            av_free(s->visualization_buffer[i]);
+        av_freep(&s->visualization_buffer[i]);
  }
  
  #ifdef CONFIG_ENCODERS
@@ -770,6 +869,8 @@ int MPV_encode_init(AVCodecContext *avctx)
      MpegEncContext *s = avctx->priv_data;
      int i, dummy;
      int chroma_h_shift, chroma_v_shift;
+    
+    MPV_encode_defaults(s);
  
      avctx->pix_fmt = PIX_FMT_YUV420P; // FIXME
  
@@ -793,6 +894,7 @@ int MPV_encode_init(AVCodecContext *avctx)
      s->quarter_sample= (avctx->flags & CODEC_FLAG_QPEL)!=0;
      s->mpeg_quant= avctx->mpeg_quant;
      s->rtp_mode= !!avctx->rtp_payload_size;
+    s->intra_dc_precision= avctx->intra_dc_precision;
  
      if (s->gop_size <= 1) {
          s->intra_only = 1;
@@ -825,8 +927,15 @@ int MPV_encode_init(AVCodecContext *avctx)
  
      if(avctx->rc_min_rate && avctx->rc_max_rate != avctx->rc_min_rate){
          av_log(avctx, AV_LOG_INFO, "Warning min_rate > 0 but min_rate != max_rate isnt recommanded!\n");
-    }    
+    }
+    
+    if(   s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate 
+       && (s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO)
+       && 90000LL * (avctx->rc_buffer_size-1) > s->avctx->rc_max_rate*0xFFFFLL){
          
+        av_log(avctx, AV_LOG_INFO, "Warning vbv_delay will be set to 0xFFFF (=VBR) as the specified vbv buffer is too large for the given bitrate!\n");
+    }
+       
      if((s->flags & CODEC_FLAG_4MV) && s->codec_id != CODEC_ID_MPEG4 
         && s->codec_id != CODEC_ID_H263 && s->codec_id != CODEC_ID_H263P && s->codec_id != CODEC_ID_FLV1){
          av_log(avctx, AV_LOG_ERROR, "4MV not supported by codec\n");
@@ -857,7 +966,13 @@ int MPV_encode_init(AVCodecContext *avctx)
          av_log(avctx, AV_LOG_ERROR, "b frames not supported by codec\n");
          return -1;
      }
-    
+
+    if((s->flags & (CODEC_FLAG_INTERLACED_DCT|CODEC_FLAG_INTERLACED_ME|CODEC_FLAG_ALT_SCAN)) 
+       && s->codec_id != CODEC_ID_MPEG4 && s->codec_id != CODEC_ID_MPEG2VIDEO){
+        av_log(avctx, AV_LOG_ERROR, "interlacing not supported by codec\n");
+        return -1;
+    }
+        
      if(s->mpeg_quant && s->codec_id != CODEC_ID_MPEG4){ //FIXME mpeg2 uses that too
          av_log(avctx, AV_LOG_ERROR, "mpeg2 style quantization not supporetd by codec\n");
          return -1;
@@ -1047,28 +1162,8 @@ int MPV_encode_init(AVCodecContext *avctx)
      default:
          return -1;
      }
-
-    { /* set up some save defaults, some codecs might override them later */
-        static int done=0;
-        if(!done){
-            int i;
-            done=1;
-
-            default_mv_penalty= av_mallocz( sizeof(uint8_t)*(MAX_FCODE+1)*(2*MAX_MV+1) );
-            memset(default_mv_penalty, 0, sizeof(uint8_t)*(MAX_FCODE+1)*(2*MAX_MV+1));
-            memset(default_fcode_tab , 0, sizeof(uint8_t)*(2*MAX_MV+1));
-
-            for(i=-16; i<16; i++){
-                default_fcode_tab[i + MAX_MV]= 1;
-            }
-        }
-    }
-    s->me.mv_penalty= default_mv_penalty;
-    s->fcode_tab= default_fcode_tab;
- 
-    /* dont use mv_penalty table for crap MV as it would be confused */
-    //FIXME remove after fixing / removing old ME
-    if (s->me_method < ME_EPZS) s->me.mv_penalty = default_mv_penalty;
+    
+    avctx->has_b_frames= !s->low_delay;
  
      s->encoding = 1;
  
@@ -1084,8 +1179,6 @@ int MPV_encode_init(AVCodecContext *avctx)
      
      ff_set_cmp(&s->dsp, s->dsp.ildct_cmp, s->avctx->ildct_cmp);
      
-    ff_init_me(s);
-
  #ifdef CONFIG_ENCODERS
  #ifdef CONFIG_RISKY
      if (s->out_format == FMT_H263)
@@ -1097,7 +1190,7 @@ int MPV_encode_init(AVCodecContext *avctx)
          ff_mpeg1_encode_init(s);
  #endif
  
-    /* init default q matrix */
+    /* init q matrix */
      for(i=0;i<64;i++) {
          int j= s->dsp.idct_permutation[i];
  #ifdef CONFIG_RISKY
@@ -1130,14 +1223,7 @@ int MPV_encode_init(AVCodecContext *avctx)
  
      if(ff_rate_control_init(s) < 0)
          return -1;
-
-    s->picture_number = 0;
-    s->input_picture_number = 0;
-    s->picture_in_gop_number = 0;
-    /* motion detector init */
-    s->f_code = 1;
-    s->b_code = 1;
-
+    
      return 0;
  }
  
@@ -1278,7 +1364,7 @@ int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx)
      assert(s->last_picture_ptr==NULL || s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3);
  
      /* mark&release old frames */
-    if (s->pict_type != B_TYPE && s->last_picture_ptr && s->last_picture_ptr->data[0]) {
+    if (s->pict_type != B_TYPE && s->last_picture_ptr && s->last_picture_ptr != s->next_picture_ptr && s->last_picture_ptr->data[0]) {
          avctx->release_buffer(avctx, (AVFrame*)s->last_picture_ptr);
  
          /* release forgotten pictures */
@@ -1308,7 +1394,7 @@ alloc:
              pic= (AVFrame*)&s->picture[i];
          }
  
-        pic->reference= s->pict_type != B_TYPE ? 3 : 0;
+        pic->reference= s->pict_type != B_TYPE && !s->dropable ? 3 : 0;
  
          pic->coded_picture_number= s->coded_picture_number++;
          
@@ -1330,8 +1416,14 @@ alloc:
    if(s->out_format != FMT_H264 || s->codec_id == CODEC_ID_SVQ3){
      if (s->pict_type != B_TYPE) {
          s->last_picture_ptr= s->next_picture_ptr;
-        s->next_picture_ptr= s->current_picture_ptr;
+        if(!s->dropable)
+            s->next_picture_ptr= s->current_picture_ptr;
      }
+/*    av_log(s->avctx, AV_LOG_DEBUG, "L%p N%p C%p L%p N%p C%p type:%d drop:%d\n", s->last_picture_ptr, s->next_picture_ptr,s->current_picture_ptr,
+        s->last_picture_ptr    ? s->last_picture_ptr->data[0] : NULL, 
+        s->next_picture_ptr    ? s->next_picture_ptr->data[0] : NULL, 
+        s->current_picture_ptr ? s->current_picture_ptr->data[0] : NULL,
+        s->pict_type, s->dropable);*/
      
      if(s->last_picture_ptr) copy_picture(&s->last_picture, s->last_picture_ptr);
      if(s->next_picture_ptr) copy_picture(&s->next_picture, s->next_picture_ptr);
@@ -1368,6 +1460,9 @@ alloc:
      }else if(s->out_format == FMT_H263){
          s->dct_unquantize_intra = s->dct_unquantize_h263_intra;
          s->dct_unquantize_inter = s->dct_unquantize_h263_inter;
+    }else if(s->out_format == FMT_H261){
+        s->dct_unquantize_intra = s->dct_unquantize_h261_intra;
+        s->dct_unquantize_inter = s->dct_unquantize_h261_inter;
      }else{
          s->dct_unquantize_intra = s->dct_unquantize_mpeg1_intra;
          s->dct_unquantize_inter = s->dct_unquantize_mpeg1_inter;
@@ -1443,7 +1538,7 @@ void MPV_frame_end(MpegEncContext *s)
   * @param color color of the arrow
   */
  static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h, int stride, int color){
-    int t, x, y, f;
+    int t, x, y, fr, f;
      
      sx= clip(sx, 0, w-1);
      sy= clip(sy, 0, h-1);
@@ -1461,8 +1556,10 @@ static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h
          ex-= sx;
          f= ((ey-sy)<<16)/ex;
          for(x= 0; x <= ex; x++){
-            y= ((x*f) + (1<<15))>>16;
-            buf[y*stride + x]+= color;
+            y = (x*f)>>16;
+            fr= (x*f)&0xFFFF;
+            buf[ y   *stride + x]+= (color*(0x10000-fr))>>16;
+            buf[(y+1)*stride + x]+= (color*         fr )>>16;
          }
      }else{
          if(sy > ey){
@@ -1474,8 +1571,10 @@ static void draw_line(uint8_t *buf, int sx, int sy, int ex, int ey, int w, int h
          if(ey) f= ((ex-sx)<<16)/ey;
          else   f= 0;
          for(y= 0; y <= ey; y++){
-            x= ((y*f) + (1<<15))>>16;
-            buf[y*stride + x]+= color;
+            x = (y*f)>>16;
+            fr= (y*f)&0xFFFF;
+            buf[y*stride + x  ]+= (color*(0x10000-fr))>>16;;
+            buf[y*stride + x+1]+= (color*         fr )>>16;;
          }
      }
  }
@@ -1619,7 +1718,7 @@ void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
                  if((s->avctx->debug_mv) && pict->motion_val){
                    int type;
                    for(type=0; type<3; type++){
-                    int direction;
+                    int direction = 0;
                      switch (type) {
                        case 0: if ((!(s->avctx->debug_mv&FF_DEBUG_VIS_MV_P_FOR)) || (pict->pict_type!=FF_P_TYPE))
                                  continue;
@@ -1637,12 +1736,13 @@ void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
                      if(!USES_LIST(pict->mb_type[mb_index], direction))
                          continue;
  
+                    //FIXME for h264
                      if(IS_8X8(pict->mb_type[mb_index])){
                        int i;
                        for(i=0; i<4; i++){
                          int sx= mb_x*16 + 4 + 8*(i&1);
                          int sy= mb_y*16 + 4 + 8*(i>>1);
-                        int xy= 1 + mb_x*2 + (i&1) + (mb_y*2 + 1 + (i>>1))*(s->mb_width*2 + 2);
+                        int xy= mb_x*2 + (i&1) + (mb_y*2 + (i>>1))*s->b8_stride;
                          int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                          int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
                          draw_arrow(ptr, sx, sy, mx, my, s->width, s->height, s->linesize, 100);
@@ -1652,15 +1752,19 @@ void ff_print_debug_info(MpegEncContext *s, AVFrame *pict){
                        for(i=0; i<2; i++){
                          int sx=mb_x*16 + 8;
                          int sy=mb_y*16 + 4 + 8*i;
-                        int xy=1 + mb_x*2 + (mb_y*2 + 1 + i)*(s->mb_width*2 + 2);
-                        int mx=(pict->motion_val[direction][xy][0]>>shift) + sx;
-                        int my=(pict->motion_val[direction][xy][1]>>shift) + sy;
-                        draw_arrow(ptr, sx, sy, mx, my, s->width, s->height, s->linesize, 100);
+                        int xy= mb_x*2 + (mb_y*2 + i)*s->b8_stride;
+                        int mx=(pict->motion_val[direction][xy][0]>>shift);
+                        int my=(pict->motion_val[direction][xy][1]>>shift);
+                        
+                        if(IS_INTERLACED(pict->mb_type[mb_index]))
+                            my*=2;
+                        
+                        draw_arrow(ptr, sx, sy, mx+sx, my+sy, s->width, s->height, s->linesize, 100);
                        }
                      }else{
                        int sx= mb_x*16 + 8;
                        int sy= mb_y*16 + 8;
-                      int xy= 1 + mb_x*2 + (mb_y*2 + 1)*(s->mb_width*2 + 2);
+                      int xy= mb_x*2 + mb_y*2*s->b8_stride;
                        int mx= (pict->motion_val[direction][xy][0]>>shift) + sx;
                        int my= (pict->motion_val[direction][xy][1]>>shift) + sy;
                        draw_arrow(ptr, sx, sy, mx, my, s->width, s->height, s->linesize, 100);
@@ -1837,11 +1941,21 @@ static int load_input_picture(MpegEncContext *s, AVFrame *pic_arg){
              }
          }
      }
-    copy_picture_attributes(pic, pic_arg);
+    copy_picture_attributes(s, pic, pic_arg);
      
      pic->display_picture_number= s->input_picture_number++;
+    if(pic->pts != AV_NOPTS_VALUE){ 
+        s->user_specified_pts= pic->pts;
+    }else{
+        if(s->user_specified_pts){
+            pic->pts= s->user_specified_pts + AV_TIME_BASE*(int64_t)s->avctx->frame_rate_base / s->avctx->frame_rate;
+            av_log(s->avctx, AV_LOG_INFO, "Warning: AVFrame.pts=? trying to guess (%Ld)\n", pic->pts);
+        }else{
+            pic->pts= av_rescale(pic->display_picture_number*(int64_t)s->avctx->frame_rate_base, AV_TIME_BASE, s->avctx->frame_rate);
+        }
+    }
    }
-
+  
      /* shift buffer entries */
      for(i=1; i<MAX_PICTURE_COUNT /*s->encoding_delay+1*/; i++)
          s->input_picture[i-1]= s->input_picture[i];
@@ -1956,11 +2070,12 @@ static void select_input_picture(MpegEncContext *s){
                  s->reordered_input_picture[0]->data[i]= NULL;
              s->reordered_input_picture[0]->type= 0;
              
-            copy_picture_attributes((AVFrame*)pic, (AVFrame*)s->reordered_input_picture[0]);
              pic->reference              = s->reordered_input_picture[0]->reference;
              
              alloc_picture(s, pic, 0);
  
+            copy_picture_attributes(s, (AVFrame*)pic, (AVFrame*)s->reordered_input_picture[0]);
+
              s->current_picture_ptr= pic;
          }else{
              // input is not a shared pix -> reuse buffer for current_pix
@@ -1995,10 +2110,11 @@ int MPV_encode_picture(AVCodecContext *avctx,
      }
      
      for(i=0; i<avctx->thread_count; i++){
-        int y= s->thread_context[i]->start_mb_y;
+        int start_y= s->thread_context[i]->start_mb_y;
+        int   end_y= s->thread_context[i]->  end_mb_y;
          int h= s->mb_height;
-        uint8_t *start= buf + buf_size* y   /h;
-        uint8_t *end  = buf + buf_size*(y+1)/h;
+        uint8_t *start= buf + buf_size*start_y/h;
+        uint8_t *end  = buf + buf_size*  end_y/h;
  
          init_put_bits(&s->thread_context[i]->pb, start, end - start);
      }
@@ -2041,7 +2157,7 @@ int MPV_encode_picture(AVCodecContext *avctx,
          }
  
          flush_put_bits(&s->pb);
-        s->frame_bits  = (pbBufPtr(&s->pb) - s->pb.buf) * 8;
+        s->frame_bits  = put_bits_count(&s->pb);
  
          stuffing_count= ff_vbv_update(s, s->frame_bits);
          if(stuffing_count){
@@ -2064,11 +2180,12 @@ int MPV_encode_picture(AVCodecContext *avctx,
                  av_log(s->avctx, AV_LOG_ERROR, "vbv buffer overflow\n");
              }
              flush_put_bits(&s->pb);
-            s->frame_bits  = (pbBufPtr(&s->pb) - s->pb.buf) * 8;
+            s->frame_bits  = put_bits_count(&s->pb);
          }
  
          /* update mpeg1/2 vbv_delay for CBR */    
-        if(s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate){
+        if(s->avctx->rc_max_rate && s->avctx->rc_min_rate == s->avctx->rc_max_rate && s->out_format == FMT_MPEG1
+           && 90000LL * (avctx->rc_buffer_size-1) <= s->avctx->rc_max_rate*0xFFFFLL){
              int vbv_delay;
  
              assert(s->repeat_first_field==0);
@@ -2097,8 +2214,7 @@ int MPV_encode_picture(AVCodecContext *avctx,
  
  static inline void gmc1_motion(MpegEncContext *s,
                                 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
-                               int dest_offset,
-                               uint8_t **ref_picture, int src_offset)
+                               uint8_t **ref_picture)
  {
      uint8_t *ptr;
      int offset, src_x, src_y, linesize, uvlinesize;
@@ -2121,9 +2237,8 @@ static inline void gmc1_motion(MpegEncContext *s,
      linesize = s->linesize;
      uvlinesize = s->uvlinesize;
      
-    ptr = ref_picture[0] + (src_y * linesize) + src_x + src_offset;
+    ptr = ref_picture[0] + (src_y * linesize) + src_x;
  
-    dest_y+=dest_offset;
      if(s->flags&CODEC_FLAG_EMU_EDGE){
          if(   (unsigned)src_x >= s->h_edge_pos - 17
             || (unsigned)src_y >= s->v_edge_pos - 17){
@@ -2161,7 +2276,7 @@ static inline void gmc1_motion(MpegEncContext *s,
      if (src_y == s->height>>1)
          motion_y =0;
  
-    offset = (src_y * uvlinesize) + src_x + (src_offset>>1);
+    offset = (src_y * uvlinesize) + src_x;
      ptr = ref_picture[1] + offset;
      if(s->flags&CODEC_FLAG_EMU_EDGE){
          if(   (unsigned)src_x >= (s->h_edge_pos>>1) - 9
@@ -2171,22 +2286,21 @@ static inline void gmc1_motion(MpegEncContext *s,
              emu=1;
          }
      }
-    s->dsp.gmc1(dest_cb + (dest_offset>>1), ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
+    s->dsp.gmc1(dest_cb, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
      
      ptr = ref_picture[2] + offset;
      if(emu){
          ff_emulated_edge_mc(s->edge_emu_buffer, ptr, uvlinesize, 9, 9, src_x, src_y, s->h_edge_pos>>1, s->v_edge_pos>>1);
          ptr= s->edge_emu_buffer;
      }
-    s->dsp.gmc1(dest_cr + (dest_offset>>1), ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
+    s->dsp.gmc1(dest_cr, ptr, uvlinesize, 8, motion_x&15, motion_y&15, 128 - s->no_rounding);
      
      return;
  }
  
  static inline void gmc_motion(MpegEncContext *s,
                                 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
-                               int dest_offset,
-                               uint8_t **ref_picture, int src_offset)
+                               uint8_t **ref_picture)
  {
      uint8_t *ptr;
      int linesize, uvlinesize;
@@ -2196,10 +2310,8 @@ static inline void gmc_motion(MpegEncContext *s,
      linesize = s->linesize;
      uvlinesize = s->uvlinesize;
  
-    ptr = ref_picture[0] + src_offset;
+    ptr = ref_picture[0];
  
-    dest_y+=dest_offset;
-    
      ox= s->sprite_offset[0][0] + s->sprite_delta[0][0]*s->mb_x*16 + s->sprite_delta[0][1]*s->mb_y*16;
      oy= s->sprite_offset[0][1] + s->sprite_delta[1][0]*s->mb_x*16 + s->sprite_delta[1][1]*s->mb_y*16;
  
@@ -2220,14 +2332,10 @@ static inline void gmc_motion(MpegEncContext *s,
  
      if(s->flags&CODEC_FLAG_GRAY) return;
  
-
-    dest_cb+=dest_offset>>1;
-    dest_cr+=dest_offset>>1;
-    
      ox= s->sprite_offset[1][0] + s->sprite_delta[0][0]*s->mb_x*8 + s->sprite_delta[0][1]*s->mb_y*8;
      oy= s->sprite_offset[1][1] + s->sprite_delta[1][0]*s->mb_x*8 + s->sprite_delta[1][1]*s->mb_y*8;
  
-    ptr = ref_picture[1] + (src_offset>>1);
+    ptr = ref_picture[1];
      s->dsp.gmc(dest_cb, ptr, uvlinesize, 8,
             ox, 
             oy, 
@@ -2236,7 +2344,7 @@ static inline void gmc_motion(MpegEncContext *s,
             a+1, (1<<(2*a+1)) - s->no_rounding,
             s->h_edge_pos>>1, s->v_edge_pos>>1);
      
-    ptr = ref_picture[2] + (src_offset>>1);
+    ptr = ref_picture[2];
      s->dsp.gmc(dest_cr, ptr, uvlinesize, 8,
             ox, 
             oy, 
@@ -2318,7 +2426,8 @@ void ff_emulated_edge_mc(uint8_t *buf, uint8_t *src, int linesize, int block_w,
  }
  
  static inline int hpel_motion(MpegEncContext *s, 
-                                  uint8_t *dest, uint8_t *src, 
+                                  uint8_t *dest, uint8_t *src,
+                                  int field_based, int field_select,
                                    int src_x, int src_y,
                                    int width, int height, int stride,
                                    int h_edge_pos, int v_edge_pos,
@@ -2344,12 +2453,14 @@ static inline int hpel_motion(MpegEncContext *s,
      if(s->unrestricted_mv && (s->flags&CODEC_FLAG_EMU_EDGE)){
          if(   (unsigned)src_x > h_edge_pos - (motion_x&1) - w
             || (unsigned)src_y > v_edge_pos - (motion_y&1) - h){
-            ff_emulated_edge_mc(s->edge_emu_buffer, src, stride, w+1, h+1,
-                             src_x, src_y, h_edge_pos, v_edge_pos);
+            ff_emulated_edge_mc(s->edge_emu_buffer, src, s->linesize, w+1, (h+1)<<field_based,
+                             src_x, src_y<<field_based, h_edge_pos, s->v_edge_pos);
              src= s->edge_emu_buffer;
              emu=1;
          }
      }
+    if(field_select)
+        src += s->linesize;
      pix_op[dxy](dest, src, stride, h);
      return emu;
  }
@@ -2357,14 +2468,13 @@ static inline int hpel_motion(MpegEncContext *s,
  /* apply one mpeg motion vector to the three components */
  static inline void mpeg_motion(MpegEncContext *s,
                                 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
-                               int dest_offset,
-                               uint8_t **ref_picture, int src_offset,
-                               int field_based, op_pixels_func (*pix_op)[4],
+                               int field_based, int bottom_field, int field_select,
+                               uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
                                 int motion_x, int motion_y, int h)
  {
-    uint8_t *ptr;
-    int dxy, offset, mx, my, src_x, src_y, height, v_edge_pos, uvlinesize;
-    int emu=0;
+    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
+    int dxy, uvdxy, mx, my, src_x, src_y, uvsrc_x, uvsrc_y, v_edge_pos, uvlinesize, linesize;
+    
  #if 0    
  if(s->quarter_sample)
  {
@@ -2373,61 +2483,78 @@ if(s->quarter_sample)
  }
  #endif
  
-    height = s->height >> field_based;
      v_edge_pos = s->v_edge_pos >> field_based;
+    linesize   = s->current_picture.linesize[0] << field_based;
      uvlinesize = s->current_picture.linesize[1] << field_based;
  
-    emu= hpel_motion(s, 
-                dest_y + dest_offset, ref_picture[0] + src_offset,
-                s->mb_x * 16, s->mb_y * (16 >> field_based),
-                s->width, height, s->current_picture.linesize[0] << field_based,
-                s->h_edge_pos, v_edge_pos,
-                16, h, pix_op[0],
-                motion_x, motion_y);
-
-
-    if(s->flags&CODEC_FLAG_GRAY) return;
+    dxy = ((motion_y & 1) << 1) | (motion_x & 1);
+    src_x = s->mb_x* 16               + (motion_x >> 1);
+    src_y = s->mb_y*(16>>field_based) + (motion_y >> 1);
  
      if (s->out_format == FMT_H263) {
-        dxy = 0;
-        if ((motion_x & 3) != 0)
-            dxy |= 1;
-        if ((motion_y & 3) != 0)
-            dxy |= 2;
-        mx = motion_x >> 2;
-        my = motion_y >> 2;
+        if((s->workaround_bugs & FF_BUG_HPEL_CHROMA) && field_based){
+            mx = (motion_x>>1)|(motion_x&1);
+            my = motion_y >>1;
+            uvdxy = ((my & 1) << 1) | (mx & 1);
+            uvsrc_x = s->mb_x* 8               + (mx >> 1);
+            uvsrc_y = s->mb_y*(8>>field_based) + (my >> 1);
+        }else{
+            uvdxy = dxy | (motion_y & 2) | ((motion_x & 2) >> 1);
+            uvsrc_x = src_x>>1;
+            uvsrc_y = src_y>>1;
+        }
+    }else if(s->out_format == FMT_H261){//even chroma mv's are full pel in H261
+        mx = motion_x / 4;
+        my = motion_y / 4;
+        uvdxy = 0;
+        uvsrc_x = s->mb_x*8 + mx;
+        uvsrc_y = s->mb_y*8 + my;
      } else {
          mx = motion_x / 2;
          my = motion_y / 2;
-        dxy = ((my & 1) << 1) | (mx & 1);
-        mx >>= 1;
-        my >>= 1;
+        uvdxy = ((my & 1) << 1) | (mx & 1);
+        uvsrc_x = s->mb_x* 8               + (mx >> 1);
+        uvsrc_y = s->mb_y*(8>>field_based) + (my >> 1);
      }
-    
-    src_x = s->mb_x * 8 + mx;
-    src_y = s->mb_y * (8 >> field_based) + my;
-    src_x = clip(src_x, -8, s->width >> 1);
-    if (src_x == (s->width >> 1))
-        dxy &= ~1;
-    src_y = clip(src_y, -8, height >> 1);
-    if (src_y == (height >> 1))
-        dxy &= ~2;
-    offset = (src_y * uvlinesize) + src_x + (src_offset >> 1);
-    ptr = ref_picture[1] + offset;
-    if(emu){
-        ff_emulated_edge_mc(s->edge_emu_buffer, ptr - (src_offset >> 1), s->uvlinesize, 9, 9+field_based, 
-                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
-        ptr= s->edge_emu_buffer + (src_offset >> 1);
+
+    ptr_y  = ref_picture[0] + src_y * linesize + src_x;
+    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
+    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;
+
+    if(   (unsigned)src_x > s->h_edge_pos - (motion_x&1) - 16
+       || (unsigned)src_y >    v_edge_pos - (motion_y&1) - h){
+            ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based,
+                             src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
+            ptr_y = s->edge_emu_buffer;
+            if(!(s->flags&CODEC_FLAG_GRAY)){
+                uint8_t *uvbuf= s->edge_emu_buffer+18*s->linesize;
+                ff_emulated_edge_mc(uvbuf  , ptr_cb, s->uvlinesize, 9, 9+field_based, 
+                                 uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
+                ff_emulated_edge_mc(uvbuf+16, ptr_cr, s->uvlinesize, 9, 9+field_based, 
+                                 uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
+                ptr_cb= uvbuf;
+                ptr_cr= uvbuf+16;
+            }
      }
-    pix_op[1][dxy](dest_cb + (dest_offset >> 1), ptr, uvlinesize, h >> 1);
  
-    ptr = ref_picture[2] + offset;
-    if(emu){
-        ff_emulated_edge_mc(s->edge_emu_buffer, ptr - (src_offset >> 1), s->uvlinesize, 9, 9+field_based, 
-                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
-        ptr= s->edge_emu_buffer + (src_offset >> 1);
+    if(bottom_field){ //FIXME use this for field pix too instead of the obnoxious hack which changes picture.data
+        dest_y += s->linesize;
+        dest_cb+= s->uvlinesize;
+        dest_cr+= s->uvlinesize;
+    }
+
+    if(field_select){
+        ptr_y += s->linesize;
+        ptr_cb+= s->uvlinesize;
+        ptr_cr+= s->uvlinesize;
+    }
+
+    pix_op[0][dxy](dest_y, ptr_y, linesize, h);
+    
+    if(!(s->flags&CODEC_FLAG_GRAY)){
+        pix_op[1][uvdxy](dest_cb, ptr_cb, uvlinesize, h >> 1);
+        pix_op[1][uvdxy](dest_cr, ptr_cr, uvlinesize, h >> 1);
      }
-    pix_op[1][dxy](dest_cr + (dest_offset >> 1), ptr, uvlinesize, h >> 1);
  }
  //FIXME move to dsputil, avg variant, 16x16 version
  static inline void put_obmc(uint8_t *dst, uint8_t *src[5], int stride){
@@ -2499,7 +2626,7 @@ static inline void obmc_motion(MpegEncContext *s,
              ptr[i]= ptr[MID];
          }else{
              ptr[i]= s->obmc_scratchpad + 8*(i&1) + s->linesize*8*(i>>1);
-            hpel_motion(s, ptr[i], src,
+            hpel_motion(s, ptr[i], src, 0, 0,
                          src_x, src_y,
                          s->width, s->height, s->linesize,
                          s->h_edge_pos, s->v_edge_pos,
@@ -2513,54 +2640,22 @@ static inline void obmc_motion(MpegEncContext *s,
  
  static inline void qpel_motion(MpegEncContext *s,
                                 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
-                               int dest_offset,
-                               uint8_t **ref_picture, int src_offset,
-                               int field_based, op_pixels_func (*pix_op)[4],
+                               int field_based, int bottom_field, int field_select,
+                               uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
                                 qpel_mc_func (*qpix_op)[16],
                                 int motion_x, int motion_y, int h)
  {
-    uint8_t *ptr;
-    int dxy, offset, mx, my, src_x, src_y, height, v_edge_pos, linesize, uvlinesize;
-    int emu=0;
+    uint8_t *ptr_y, *ptr_cb, *ptr_cr;
+    int dxy, uvdxy, mx, my, src_x, src_y, uvsrc_x, uvsrc_y, v_edge_pos, linesize, uvlinesize;
  
      dxy = ((motion_y & 3) << 2) | (motion_x & 3);
-    src_x = s->mb_x * 16 + (motion_x >> 2);
+    src_x = s->mb_x *  16                 + (motion_x >> 2);
      src_y = s->mb_y * (16 >> field_based) + (motion_y >> 2);
  
-    height = s->height >> field_based;
      v_edge_pos = s->v_edge_pos >> field_based;
-    src_x = clip(src_x, -16, s->width);
-    if (src_x == s->width)
-        dxy &= ~3;
-    src_y = clip(src_y, -16, height);
-    if (src_y == height)
-        dxy &= ~12;
      linesize = s->linesize << field_based;
      uvlinesize = s->uvlinesize << field_based;
-    ptr = ref_picture[0] + (src_y * linesize) + src_x + src_offset;
-    dest_y += dest_offset;
-//printf("%d %d %d\n", src_x, src_y, dxy);
      
-    if(s->flags&CODEC_FLAG_EMU_EDGE){
-        if(   (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 16 
-           || (unsigned)src_y >    v_edge_pos - (motion_y&3) - h  ){
-            ff_emulated_edge_mc(s->edge_emu_buffer, ptr - src_offset, s->linesize, 17, 17+field_based, 
-                             src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
-            ptr= s->edge_emu_buffer + src_offset;
-            emu=1;
-        }
-    }
-    if(!field_based)
-        qpix_op[0][dxy](dest_y, ptr, linesize);
-    else{
-        //damn interlaced mode
-        //FIXME boundary mirroring is not exactly correct here
-        qpix_op[1][dxy](dest_y  , ptr  , linesize);
-        qpix_op[1][dxy](dest_y+8, ptr+8, linesize);
-    }
-
-    if(s->flags&CODEC_FLAG_GRAY) return;
-
      if(field_based){
          mx= motion_x/2;
          my= motion_y>>1;
@@ -2578,35 +2673,56 @@ static inline void qpel_motion(MpegEncContext *s,
      mx= (mx>>1)|(mx&1);
      my= (my>>1)|(my&1);
  
-    dxy= (mx&1) | ((my&1)<<1);
+    uvdxy= (mx&1) | ((my&1)<<1);
      mx>>=1;
      my>>=1;
  
-    src_x = s->mb_x * 8 + mx;
-    src_y = s->mb_y * (8 >> field_based) + my;
-    src_x = clip(src_x, -8, s->width >> 1);
-    if (src_x == (s->width >> 1))
-        dxy &= ~1;
-    src_y = clip(src_y, -8, height >> 1);
-    if (src_y == (height >> 1))
-        dxy &= ~2;
+    uvsrc_x = s->mb_x *  8                 + mx;
+    uvsrc_y = s->mb_y * (8 >> field_based) + my;
  
-    offset = (src_y * uvlinesize) + src_x + (src_offset >> 1);
-    ptr = ref_picture[1] + offset;
-    if(emu){
-        ff_emulated_edge_mc(s->edge_emu_buffer, ptr - (src_offset >> 1), s->uvlinesize, 9, 9 + field_based, 
-                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
-        ptr= s->edge_emu_buffer + (src_offset >> 1);
+    ptr_y  = ref_picture[0] +   src_y *   linesize +   src_x;
+    ptr_cb = ref_picture[1] + uvsrc_y * uvlinesize + uvsrc_x;
+    ptr_cr = ref_picture[2] + uvsrc_y * uvlinesize + uvsrc_x;
+
+    if(   (unsigned)src_x > s->h_edge_pos - (motion_x&3) - 16 
+       || (unsigned)src_y >    v_edge_pos - (motion_y&3) - h  ){
+        ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, s->linesize, 17, 17+field_based, 
+                         src_x, src_y<<field_based, s->h_edge_pos, s->v_edge_pos);
+        ptr_y= s->edge_emu_buffer;
+        if(!(s->flags&CODEC_FLAG_GRAY)){
+            uint8_t *uvbuf= s->edge_emu_buffer + 18*s->linesize;
+            ff_emulated_edge_mc(uvbuf, ptr_cb, s->uvlinesize, 9, 9 + field_based, 
+                             uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
+            ff_emulated_edge_mc(uvbuf + 16, ptr_cr, s->uvlinesize, 9, 9 + field_based, 
+                             uvsrc_x, uvsrc_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
+            ptr_cb= uvbuf;
+            ptr_cr= uvbuf + 16;
+        }
      }
-    pix_op[1][dxy](dest_cb + (dest_offset >> 1), ptr,  uvlinesize, h >> 1);
-    
-    ptr = ref_picture[2] + offset;
-    if(emu){
-        ff_emulated_edge_mc(s->edge_emu_buffer, ptr - (src_offset >> 1), s->uvlinesize, 9, 9 + field_based, 
-                         src_x, src_y<<field_based, s->h_edge_pos>>1, s->v_edge_pos>>1);
-        ptr= s->edge_emu_buffer + (src_offset >> 1);
+
+    if(!field_based)
+        qpix_op[0][dxy](dest_y, ptr_y, linesize);
+    else{
+        if(bottom_field){
+            dest_y += s->linesize;
+            dest_cb+= s->uvlinesize;
+            dest_cr+= s->uvlinesize;
+        }
+
+        if(field_select){
+            ptr_y  += s->linesize;
+            ptr_cb += s->uvlinesize;
+            ptr_cr += s->uvlinesize;
+        }
+        //damn interlaced mode
+        //FIXME boundary mirroring is not exactly correct here
+        qpix_op[1][dxy](dest_y  , ptr_y  , linesize);
+        qpix_op[1][dxy](dest_y+8, ptr_y+8, linesize);
+    }
+    if(!(s->flags&CODEC_FLAG_GRAY)){
+        pix_op[1][uvdxy](dest_cr, ptr_cr, uvlinesize, h >> 1);
+        pix_op[1][uvdxy](dest_cb, ptr_cb, uvlinesize, h >> 1);
      }
-    pix_op[1][dxy](dest_cr + (dest_offset >> 1), ptr,  uvlinesize, h >> 1);
  }
  
  inline int ff_h263_round_chroma(int x){
@@ -2694,8 +2810,8 @@ static inline void MPV_motion(MpegEncContext *s,
      if(s->obmc && s->pict_type != B_TYPE){
          int16_t mv_cache[4][4][2];
          const int xy= s->mb_x + s->mb_y*s->mb_stride;
-        const int mot_stride= s->mb_width*2 + 2;
-        const int mot_xy= 1 + mb_x*2 + (mb_y*2 + 1)*mot_stride;
+        const int mot_stride= s->b8_stride;
+        const int mot_xy= mb_x*2 + mb_y*2*mot_stride;
  
          assert(!s->mb_skiped);
                  
@@ -2757,16 +2873,16 @@ static inline void MPV_motion(MpegEncContext *s,
  #ifdef CONFIG_RISKY
          if(s->mcsel){
              if(s->real_sprite_warping_points==1){
-                gmc1_motion(s, dest_y, dest_cb, dest_cr, 0,
-                            ref_picture, 0);
+                gmc1_motion(s, dest_y, dest_cb, dest_cr,
+                            ref_picture);
              }else{
-                gmc_motion(s, dest_y, dest_cb, dest_cr, 0,
-                            ref_picture, 0);
+                gmc_motion(s, dest_y, dest_cb, dest_cr,
+                            ref_picture);
              }
          }else if(s->quarter_sample){
-            qpel_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture, 0,
-                        0, pix_op, qpix_op,
+            qpel_motion(s, dest_y, dest_cb, dest_cr, 
+                        0, 0, 0,
+                        ref_picture, pix_op, qpix_op,
                          s->mv[dir][0][0], s->mv[dir][0][1], 16);
          }else if(s->mspel){
              ff_mspel_motion(s, dest_y, dest_cb, dest_cr,
@@ -2775,9 +2891,9 @@ static inline void MPV_motion(MpegEncContext *s,
          }else
  #endif
          {
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture, 0,
-                        0, pix_op,
+            mpeg_motion(s, dest_y, dest_cb, dest_cr, 
+                        0, 0, 0,
+                        ref_picture, pix_op,
                          s->mv[dir][0][0], s->mv[dir][0][1], 16);
          }           
          break;
@@ -2818,7 +2934,7 @@ static inline void MPV_motion(MpegEncContext *s,
          }else{
              for(i=0;i<4;i++) {
                  hpel_motion(s, dest_y + ((i & 1) * 8) + (i >> 1) * 8 * s->linesize,
-                            ref_picture[0],
+                            ref_picture[0], 0, 0,
                              mb_x * 16 + (i & 1) * 8, mb_y * 16 + (i >>1) * 8,
                              s->width, s->height, s->linesize,
                              s->h_edge_pos, s->v_edge_pos,
@@ -2836,140 +2952,83 @@ static inline void MPV_motion(MpegEncContext *s,
      case MV_TYPE_FIELD:
          if (s->picture_structure == PICT_FRAME) {
              if(s->quarter_sample){
-                /* top field */
-                qpel_motion(s, dest_y, dest_cb, dest_cr, 0,
-                            ref_picture, s->field_select[dir][0] ? s->linesize : 0,
-                            1, pix_op, qpix_op,
-                            s->mv[dir][0][0], s->mv[dir][0][1], 8);
-                /* bottom field */
-                qpel_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
-                            ref_picture, s->field_select[dir][1] ? s->linesize : 0,
-                            1, pix_op, qpix_op,
-                            s->mv[dir][1][0], s->mv[dir][1][1], 8);
+                for(i=0; i<2; i++){
+                    qpel_motion(s, dest_y, dest_cb, dest_cr,
+                                1, i, s->field_select[dir][i],
+                                ref_picture, pix_op, qpix_op,
+                                s->mv[dir][i][0], s->mv[dir][i][1], 8);
+                }
              }else{
                  /* top field */       
-                mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                            ref_picture, s->field_select[dir][0] ? s->linesize : 0,
-                            1, pix_op,
+                mpeg_motion(s, dest_y, dest_cb, dest_cr,
+                            1, 0, s->field_select[dir][0],
+                            ref_picture, pix_op,
                              s->mv[dir][0][0], s->mv[dir][0][1], 8);
                  /* bottom field */
-                mpeg_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
-                            ref_picture, s->field_select[dir][1] ? s->linesize : 0,
-                            1, pix_op,
+                mpeg_motion(s, dest_y, dest_cb, dest_cr,
+                            1, 1, s->field_select[dir][1],
+                            ref_picture, pix_op,
                              s->mv[dir][1][0], s->mv[dir][1][1], 8);
              }
          } else {
-            int offset;
-            if(s->picture_structure == s->field_select[dir][0] + 1 || s->pict_type == B_TYPE || s->first_field){
-                offset= s->field_select[dir][0] ? s->linesize : 0;
-            }else{
-                ref_picture= s->current_picture.data;
-                offset= s->field_select[dir][0] ? s->linesize : -s->linesize; 
+            if(s->picture_structure != s->field_select[dir][0] + 1 && s->pict_type != B_TYPE && !s->first_field){
+                ref_picture= s->current_picture_ptr->data;
              } 
  
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture, offset,
-                        0, pix_op,
+            mpeg_motion(s, dest_y, dest_cb, dest_cr,
+                        0, 0, s->field_select[dir][0],
+                        ref_picture, pix_op,
                          s->mv[dir][0][0], s->mv[dir][0][1], 16);
          }
          break;
-    case MV_TYPE_16X8:{
-        int offset;
-         uint8_t ** ref2picture;
+    case MV_TYPE_16X8:
+        for(i=0; i<2; i++){
+            uint8_t ** ref2picture;
  
-            if(s->picture_structure == s->field_select[dir][0] + 1 || s->pict_type == B_TYPE || s->first_field){
+            if(s->picture_structure == s->field_select[dir][i] + 1 || s->pict_type == B_TYPE || s->first_field){
                  ref2picture= ref_picture;
-                offset= s->field_select[dir][0] ? s->linesize : 0;
              }else{
-                ref2picture= s->current_picture.data;
-                offset= s->field_select[dir][0] ? s->linesize : -s->linesize; 
+                ref2picture= s->current_picture_ptr->data;
              } 
  
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref2picture, offset,
-                        0, pix_op,
-                        s->mv[dir][0][0], s->mv[dir][0][1], 8);
-
-
-            if(s->picture_structure == s->field_select[dir][1] + 1 || s->pict_type == B_TYPE || s->first_field){
-                ref2picture= ref_picture;
-                offset= s->field_select[dir][1] ? s->linesize : 0;
-            }else{
-                ref2picture= s->current_picture.data;
-                offset= s->field_select[dir][1] ? s->linesize : -s->linesize; 
-            } 
-            // I know it is ugly but this is the only way to fool emu_edge without rewrite mpeg_motion
-            mpeg_motion(s, dest_y+16*s->linesize, dest_cb+8*s->uvlinesize, dest_cr+8*s->uvlinesize,
-                        0,
-                        ref2picture, offset,
-                        0, pix_op,
-                        s->mv[dir][1][0], s->mv[dir][1][1]+16, 8);
-        }
-        
+            mpeg_motion(s, dest_y, dest_cb, dest_cr, 
+                        0, 0, s->field_select[dir][i],
+                        ref2picture, pix_op,
+                        s->mv[dir][i][0], s->mv[dir][i][1] + 16*i, 8);
+                
+            dest_y += 16*s->linesize;
+            dest_cb+=  8*s->uvlinesize;
+            dest_cr+=  8*s->uvlinesize;
+        }        
          break;
      case MV_TYPE_DMV:
-    {
-    op_pixels_func (*dmv_pix_op)[4];
-    int offset;
-
-        dmv_pix_op = s->dsp.put_pixels_tab;
-
          if(s->picture_structure == PICT_FRAME){
-            //put top field from top field
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture, 0,
-                        1, dmv_pix_op,
-                        s->mv[dir][0][0], s->mv[dir][0][1], 8);
-            //put bottom field from bottom field
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
-                        ref_picture, s->linesize,
-                        1, dmv_pix_op,
-                        s->mv[dir][0][0], s->mv[dir][0][1], 8);
-
-            dmv_pix_op = s->dsp.avg_pixels_tab; 
-        
-            //avg top field from bottom field
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture, s->linesize,
-                        1, dmv_pix_op,
-                        s->mv[dir][2][0], s->mv[dir][2][1], 8);
-            //avg bottom field from top field
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, s->linesize,
-                        ref_picture, 0,
-                        1, dmv_pix_op,
-                        s->mv[dir][3][0], s->mv[dir][3][1], 8);
-
+            for(i=0; i<2; i++){
+                int j;
+                for(j=0; j<2; j++){
+                    mpeg_motion(s, dest_y, dest_cb, dest_cr,
+                                1, j, j^i,
+                                ref_picture, pix_op,
+                                s->mv[dir][2*i + j][0], s->mv[dir][2*i + j][1], 8);
+                }
+                pix_op = s->dsp.avg_pixels_tab; 
+            }
          }else{
-            offset=(s->picture_structure == PICT_BOTTOM_FIELD)? 
-                         s->linesize : 0;
-
-            //put field from the same parity
-            //same parity is never in the same frame
-            mpeg_motion(s, dest_y, dest_cb, dest_cr, 0,
-                        ref_picture,offset,
-                        0,dmv_pix_op,
-                        s->mv[dir][0][0],s->mv[dir][0][1],16);
-
-            // after put we make avg of the same block
-            dmv_pix_op=s->dsp.avg_pixels_tab; 
-
-            //opposite parity is always in the same frame if this is second field
-            if(!s->first_field){
-                ref_picture = s->current_picture.data;    
-                //top field is one linesize from frame beginig
-                offset=(s->picture_structure == PICT_BOTTOM_FIELD)? 
-                        -s->linesize : s->linesize;
-            }else 
-                offset=(s->picture_structure == PICT_BOTTOM_FIELD)? 
-                        0 : s->linesize;
-
-            //avg field from the opposite parity
-            mpeg_motion(s, dest_y, dest_cb, dest_cr,0,
-                        ref_picture, offset,
-                        0,dmv_pix_op,
-                        s->mv[dir][2][0],s->mv[dir][2][1],16);
+            for(i=0; i<2; i++){
+                mpeg_motion(s, dest_y, dest_cb, dest_cr, 
+                            0, 0, s->picture_structure != i+1,
+                            ref_picture, pix_op,
+                            s->mv[dir][2*i][0],s->mv[dir][2*i][1],16);
+
+                // after put we make avg of the same block
+                pix_op=s->dsp.avg_pixels_tab; 
+
+                //opposite parity is always in the same frame if this is second field
+                if(!s->first_field){
+                    ref_picture = s->current_picture_ptr->data;    
+                }
+            }
          }
-    }
      break;
      default: assert(0);
      }
@@ -3008,7 +3067,7 @@ static inline void add_dequant_dct(MpegEncContext *s,
   */
  void ff_clean_intra_table_entries(MpegEncContext *s)
  {
-    int wrap = s->block_wrap[0];
+    int wrap = s->b8_stride;
      int xy = s->block_index[0];
      
      s->dc_val[0][xy           ] = 
@@ -3025,15 +3084,15 @@ void ff_clean_intra_table_entries(MpegEncContext *s)
          s->coded_block[xy + 1 + wrap] = 0;
      }
      /* chroma */
-    wrap = s->block_wrap[4];
-    xy = s->mb_x + 1 + (s->mb_y + 1) * wrap;
+    wrap = s->mb_stride;
+    xy = s->mb_x + s->mb_y * wrap;
      s->dc_val[1][xy] =
      s->dc_val[2][xy] = 1024;
      /* ac pred */
      memset(s->ac_val[1][xy], 0, 16 * sizeof(int16_t));
      memset(s->ac_val[2][xy], 0, 16 * sizeof(int16_t));
      
-    s->mbintra_table[s->mb_x + s->mb_y*s->mb_stride]= 0;
+    s->mbintra_table[xy]= 0;
  }
  
  /* generic function called after a macroblock has been parsed by the
@@ -3060,6 +3119,15 @@ void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64])
      mb_x = s->mb_x;
      mb_y = s->mb_y;
  
+    if(s->avctx->debug&FF_DEBUG_DCT_COEFF) {
+       /* save DCT coefficients */
+       int i,j;
+       DCTELEM *dct = &s->current_picture.dct_coeff[mb_xy*64*6];
+       for(i=0; i<6; i++)
+           for(j=0; j<64; j++)
+               *dct++ = block[i][s->dsp.idct_permutation[j]];
+    }
+
      s->current_picture.qscale_table[mb_xy]= s->qscale;
  
      /* update DC predictors for P macroblocks */
@@ -3125,8 +3193,8 @@ void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64])
              dest_cr= s->dest[2];
          }else{
              dest_y = s->b_scratchpad;
-            dest_cb= s->b_scratchpad+16*s->linesize;
-            dest_cr= s->b_scratchpad+16*s->linesize+8;
+            dest_cb= s->b_scratchpad+16*linesize;
+            dest_cr= s->b_scratchpad+16*linesize+8;
          }
          if (!s->mb_intra) {
              /* motion handling */
@@ -3344,12 +3412,12 @@ void ff_init_block_index(MpegEncContext *s){ //FIXME maybe rename
      const int linesize= s->current_picture.linesize[0]; //not s->linesize as this woulnd be wrong for field pics
      const int uvlinesize= s->current_picture.linesize[1];
          
-    s->block_index[0]= s->block_wrap[0]*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
-    s->block_index[1]= s->block_wrap[0]*(s->mb_y*2 + 1)     + s->mb_x*2;
-    s->block_index[2]= s->block_wrap[0]*(s->mb_y*2 + 2) - 1 + s->mb_x*2;
-    s->block_index[3]= s->block_wrap[0]*(s->mb_y*2 + 2)     + s->mb_x*2;
-    s->block_index[4]= s->block_wrap[4]*(s->mb_y + 1)                    + s->block_wrap[0]*(s->mb_height*2 + 2) + s->mb_x;
-    s->block_index[5]= s->block_wrap[4]*(s->mb_y + 1 + s->mb_height + 2) + s->block_wrap[0]*(s->mb_height*2 + 2) + s->mb_x;
+    s->block_index[0]= s->b8_stride*(s->mb_y*2    ) - 2 + s->mb_x*2;
+    s->block_index[1]= s->b8_stride*(s->mb_y*2    ) - 1 + s->mb_x*2;
+    s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) - 2 + s->mb_x*2;
+    s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
+    s->block_index[4]= s->mb_stride*(s->mb_y + 1)                + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
+    s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x - 1;
      
      if(s->pict_type==B_TYPE && s->avctx->draw_horiz_band && s->picture_structure==PICT_FRAME){
          s->dest[0] = s->current_picture.data[0] + s->mb_x * 16 - 16;
@@ -3398,7 +3466,6 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
      int dct_offset   = s->linesize*8; //default for progressive frames
      uint8_t *ptr_y, *ptr_cb, *ptr_cr;
      int wrap_y, wrap_c;
-    int emu=0;
      
      for(i=0; i<6; i++) skip_dct[i]=0;
      
@@ -3412,18 +3479,26 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
          if(!(s->flags&CODEC_FLAG_QP_RD)){
              s->dquant= s->qscale - last_qp;
  
-            if(s->out_format==FMT_H263)
+            if(s->out_format==FMT_H263){
                  s->dquant= clip(s->dquant, -2, 2); //FIXME RD
              
-            if(s->codec_id==CODEC_ID_MPEG4){        
-                if(!s->mb_intra){
-                    if((s->mv_dir&MV_DIRECT) || s->mv_type==MV_TYPE_8X8)
-                        s->dquant=0;
+                if(s->codec_id==CODEC_ID_MPEG4){        
+                    if(!s->mb_intra){
+                        if(s->pict_type == B_TYPE){
+                            if(s->dquant&1) 
+                                s->dquant= (s->dquant/2)*2;
+                            if(s->mv_dir&MV_DIRECT)
+                                s->dquant= 0;
+                        }
+                        if(s->mv_type==MV_TYPE_8X8)
+                            s->dquant=0;
+                    }
                  }
              }
          }
          ff_set_qscale(s, last_qp + s->dquant);
-    }
+    }else if(s->flags&CODEC_FLAG_QP_RD)
+        ff_set_qscale(s, s->qscale + s->dquant);
  
      wrap_y = s->linesize;
      wrap_c = s->uvlinesize;
@@ -3432,9 +3507,12 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
      ptr_cr = s->new_picture.data[2] + (mb_y * 8 * wrap_c) + mb_x * 8;
  
      if(mb_x*16+16 > s->width || mb_y*16+16 > s->height){
-        ff_emulated_edge_mc(s->edge_emu_buffer, ptr_y, wrap_y, 16, 16, mb_x*16, mb_y*16, s->width, s->height);
+        ff_emulated_edge_mc(s->edge_emu_buffer            , ptr_y , wrap_y,16,16,mb_x*16,mb_y*16, s->width   , s->height);
          ptr_y= s->edge_emu_buffer;
-        emu=1;
+        ff_emulated_edge_mc(s->edge_emu_buffer+18*wrap_y  , ptr_cb, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
+        ptr_cb= s->edge_emu_buffer+18*wrap_y;
+        ff_emulated_edge_mc(s->edge_emu_buffer+18*wrap_y+9, ptr_cr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
+        ptr_cr= s->edge_emu_buffer+18*wrap_y+9;
      }
  
      if (s->mb_intra) {
@@ -3466,12 +3544,6 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
              skip_dct[4]= 1;
              skip_dct[5]= 1;
          }else{
-            if(emu){ //FIXME move out of loop and fix edge_emu_buffer mess
-                ff_emulated_edge_mc(s->edge_emu_buffer, ptr_cb, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
-                ptr_cb= s->edge_emu_buffer;
-                ff_emulated_edge_mc(s->edge_emu_buffer+8, ptr_cr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
-                ptr_cr= s->edge_emu_buffer+8;
-            }
             s->dsp.get_pixels(s->block[4], ptr_cb, wrap_c);
              s->dsp.get_pixels(s->block[5], ptr_cr, wrap_c);
          }
@@ -3532,12 +3604,6 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
              skip_dct[4]= 1;
              skip_dct[5]= 1;
          }else{
-            if(emu){
-                ff_emulated_edge_mc(s->edge_emu_buffer, ptr_cb, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
-                ptr_cb= s->edge_emu_buffer;
-                ff_emulated_edge_mc(s->edge_emu_buffer+8, ptr_cr, wrap_c, 8, 8, mb_x*8, mb_y*8, s->width>>1, s->height>>1);
-                ptr_cr= s->edge_emu_buffer+8;
-            }
              s->dsp.diff_pixels(s->block[4], ptr_cb, dest_cb, wrap_c);
              s->dsp.diff_pixels(s->block[5], ptr_cr, dest_cr, wrap_c);
          }
@@ -3649,64 +3715,6 @@ static void encode_mb(MpegEncContext *s, int motion_x, int motion_y)
  
  #endif //CONFIG_ENCODERS
  
-/**
- * combines the (truncated) bitstream to a complete frame
- * @returns -1 if no complete frame could be created
- */
-int ff_combine_frame( MpegEncContext *s, int next, uint8_t **buf, int *buf_size){
-    ParseContext *pc= &s->parse_context;
-
-#if 0
-    if(pc->overread){
-        printf("overread %d, state:%X next:%d index:%d o_index:%d\n", pc->overread, pc->state, next, pc->index, pc->overread_index);
-        printf("%X %X %X %X\n", (*buf)[0], (*buf)[1],(*buf)[2],(*buf)[3]);
-    }
-#endif
-
-    /* copy overreaded byes from last frame into buffer */
-    for(; pc->overread>0; pc->overread--){
-        pc->buffer[pc->index++]= pc->buffer[pc->overread_index++];
-    }
-    
-    pc->last_index= pc->index;
-
-    /* copy into buffer end return */
-    if(next == END_NOT_FOUND){
-        pc->buffer= av_fast_realloc(pc->buffer, &pc->buffer_size, (*buf_size) + pc->index + FF_INPUT_BUFFER_PADDING_SIZE);
-
-        memcpy(&pc->buffer[pc->index], *buf, *buf_size);
-        pc->index += *buf_size;
-        return -1;
-    }
-
-    *buf_size=
-    pc->overread_index= pc->index + next;
-    
-    /* append to buffer */
-    if(pc->index){
-        pc->buffer= av_fast_realloc(pc->buffer, &pc->buffer_size, next + pc->index + FF_INPUT_BUFFER_PADDING_SIZE);
-
-        memcpy(&pc->buffer[pc->index], *buf, next + FF_INPUT_BUFFER_PADDING_SIZE );
-        pc->index = 0;
-        *buf= pc->buffer;
-    }
-
-    /* store overread bytes */
-    for(;next < 0; next++){
-        pc->state = (pc->state<<8) | pc->buffer[pc->last_index + next];
-        pc->overread++;
-    }
-
-#if 0
-    if(pc->overread){
-        printf("overread %d, state:%X next:%d index:%d o_index:%d\n", pc->overread, pc->state, next, pc->index, pc->overread_index);
-        printf("%X %X %X %X\n", (*buf)[0], (*buf)[1],(*buf)[2],(*buf)[3]);
-    }
-#endif
-
-    return 0;
-}
-
  void ff_mpeg_flush(AVCodecContext *avctx){
      int i;
      MpegEncContext *s = avctx->priv_data;
@@ -3727,26 +3735,32 @@ void ff_mpeg_flush(AVCodecContext *avctx){
      s->parse_context.overread_index= 0;
      s->parse_context.index= 0;
      s->parse_context.last_index= 0;
+    s->bitstream_buffer_size=0;
  }
  
  #ifdef CONFIG_ENCODERS
  void ff_copy_bits(PutBitContext *pb, uint8_t *src, int length)
  {
+    const uint16_t *srcw= (uint16_t*)src; // 16-bit view of src shared by the word-wise put_bits loops below
      int words= length>>4;
      int bits= length&15;
      int i;
  
      if(length==0) return;
      
-//    if(put_bits_count(pb)&7){ //FIXME
-        for(i=0; i<words; i++) put_bits(pb, 16, be2me_16(((uint16_t*)src)[i]));
-/*    }else{
+    if(words < 16){ // fewer than 16 whole words: emit them one at a time with put_bits
+        for(i=0; i<words; i++) put_bits(pb, 16, be2me_16(srcw[i]));
+    }else if(put_bits_count(pb)&7){ // output bit count is not a multiple of 8: same word-wise loop
+        for(i=0; i<words; i++) put_bits(pb, 16, be2me_16(srcw[i]));
+    }else{
+        for(i=0; put_bits_count(pb)&31; i++) // emit single bytes until the output bit count is a multiple of 32
+            put_bits(pb, 8, src[i]);
          flush_put_bits(pb);
-        memcpy(pbBufPtr(pb), src, 2*words);
-        skip_put_bytes(pb, 2*words);
-    }*/
+        memcpy(pbBufPtr(pb), src+i, 2*words-i); // bulk-copy the rest of the whole-word bytes; i bytes were already written above
+        skip_put_bytes(pb, 2*words-i);
+    }
          
-    put_bits(pb, bits, be2me_16(((uint16_t*)src)[words])>>(16-bits));
+    put_bits(pb, bits, be2me_16(srcw[words])>>(16-bits)); // remaining length&15 bits, taken from the top of the next 16-bit word
  }
  
  static inline void copy_context_before_encode(MpegEncContext *d, MpegEncContext *s, int type){
@@ -3945,6 +3959,28 @@ static int estimate_motion_thread(AVCodecContext *c, void *arg){
      return 0;
  }
  
+/**
+ * Worker run through avctx->execute() that computes the variance and mean of
+ * every 16x16 macroblock in rows [start_mb_y, end_mb_y) of plane 0 of
+ * new_picture (presumably the luma plane).
+ *
+ * For each macroblock the variance is stored in current_picture.mb_var, the
+ * rounded mean in current_picture.mb_mean, and the variance is added to
+ * me.mb_var_sum_temp of the context passed in.
+ *
+ * @param c   codec context (not used by this function)
+ * @param arg the MpegEncContext to work on
+ * @return always 0
+ */
+static int mb_var_thread(AVCodecContext *c, void *arg){
+    MpegEncContext *s= arg;
+    int mb_x, mb_y;
+
+    for(mb_y=s->start_mb_y; mb_y < s->end_mb_y; mb_y++) {
+        for(mb_x=0; mb_x < s->mb_width; mb_x++) {
+            int xx = mb_x * 16;
+            int yy = mb_y * 16;
+            uint8_t *pix = s->new_picture.data[0] + (yy * s->linesize) + xx;
+            int varc;
+            int sum = s->dsp.pix_sum(pix, s->linesize);
+
+            /* Cast before multiplying so the square is computed in unsigned
+             * arithmetic; an int multiply overflows (undefined behaviour) as
+             * soon as sum exceeds 46340 with a 32-bit int. */
+            varc = (s->dsp.pix_norm1(pix, s->linesize) - (((unsigned)sum*sum)>>8) + 500 + 128)>>8;
+
+            s->current_picture.mb_var [s->mb_stride * mb_y + mb_x] = varc;
+            s->current_picture.mb_mean[s->mb_stride * mb_y + mb_x] = (sum+128)>>8;
+            s->me.mb_var_sum_temp    += varc;
+        }
+    }
+    return 0;
+}
+
  static void write_slice_end(MpegEncContext *s){
      if(s->codec_id==CODEC_ID_MPEG4){
          if(s->partitioned_frame){
@@ -3990,7 +4026,7 @@ static int encode_thread(AVCodecContext *c, void *arg){
      for(i=0; i<3; i++){
          /* init last dc values */
          /* note: quant matrix value (8) is implied here */
-        s->last_dc[i] = 128;
+        s->last_dc[i] = 128 << s->intra_dc_precision;
          
          s->current_picture_ptr->error[i] = 0;
      }
@@ -4040,7 +4076,7 @@ static int encode_thread(AVCodecContext *c, void *arg){
              if(s->rtp_mode){
                  int current_packet_size, is_gob_start;
                  
-                current_packet_size= pbBufPtr(&s->pb) - s->ptr_lastgob; //FIXME wrong
+                current_packet_size= ((put_bits_count(&s->pb)+7)>>3) - (s->ptr_lastgob - s->pb.buf);
                  
                  is_gob_start= s->avctx->rtp_payload_size && current_packet_size >= s->avctx->rtp_payload_size && mb_y + mb_x>0; 
                  
@@ -4084,7 +4120,7 @@ static int encode_thread(AVCodecContext *c, void *arg){
                      }
          
                      if (s->avctx->rtp_callback)
-                        s->avctx->rtp_callback(s->ptr_lastgob, current_packet_size, 0);
+                        s->avctx->rtp_callback(s->avctx, s->ptr_lastgob, current_packet_size, 0);
                      
                      switch(s->codec_id){
                      case CODEC_ID_MPEG4:
@@ -4525,7 +4561,7 @@ static int encode_thread(AVCodecContext *c, void *arg){
          pdif = pbBufPtr(&s->pb) - s->ptr_lastgob;
          /* Call the RTP callback to send the last GOB */
          emms_c();
-        s->avctx->rtp_callback(s->ptr_lastgob, pdif, 0);
+        s->avctx->rtp_callback(s->avctx, s->ptr_lastgob, pdif, 0);
      }
  
      return 0;
@@ -4533,9 +4569,9 @@ static int encode_thread(AVCodecContext *c, void *arg){
  
  #define MERGE(field) dst->field += src->field; src->field=0
  static void merge_context_after_me(MpegEncContext *dst, MpegEncContext *src){
-    MERGE(scene_change_score);
-    MERGE(mc_mb_var_sum_temp);
-    MERGE(mb_var_sum_temp);
+    MERGE(me.scene_change_score);
+    MERGE(me.mc_mb_var_sum_temp);
+    MERGE(me.mb_var_sum_temp);
  }
  
  static void merge_context_after_encode(MpegEncContext *dst, MpegEncContext *src){
@@ -4570,26 +4606,25 @@ static void merge_context_after_encode(MpegEncContext *dst, MpegEncContext *src)
  
  static void encode_picture(MpegEncContext *s, int picture_number)
  {
-    int mb_x, mb_y;
-    int i, j;
+    int i;
      int bits;
  
      s->picture_number = picture_number;
      
      /* Reset the average MB variance */
-    s->mb_var_sum_temp    =
-    s->mc_mb_var_sum_temp = 0;
+    s->me.mb_var_sum_temp    =
+    s->me.mc_mb_var_sum_temp = 0;
  
  #ifdef CONFIG_RISKY
      /* we need to initialize some time vars before we can encode b-frames */
      // RAL: Condition added for MPEG1VIDEO
      if (s->codec_id == CODEC_ID_MPEG1VIDEO || s->codec_id == CODEC_ID_MPEG2VIDEO || (s->h263_pred && !s->h263_msmpeg4))
-        ff_set_mpeg4_time(s, s->picture_number); 
+        ff_set_mpeg4_time(s, s->picture_number);  //FIXME rename and use has_b_frames or similar
  #endif
          
-    s->scene_change_score=0;
+    s->me.scene_change_score=0;
      
-    s->lambda= s->current_picture_ptr->quality; //FIXME qscale / ... stuff for ME ratedistoration
+//    s->lambda= s->current_picture_ptr->quality; //FIXME qscale / ... stuff for ME ratedistoration
      
      if(s->pict_type==I_TYPE){
          if(s->msmpeg4_version >= 3) s->no_rounding=1;
@@ -4601,21 +4636,20 @@ static void encode_picture(MpegEncContext *s, int picture_number)
      
      s->mb_intra=0; //for the rate distoration & bit compare functions
      for(i=1; i<s->avctx->thread_count; i++){
-        update_duplicate_context(s->thread_context[i], s);
+        ff_update_duplicate_context(s->thread_context[i], s);
      }
-    
+
+    ff_init_me(s);
+
      /* Estimate motion for every MB */
      if(s->pict_type != I_TYPE){
-        if(s->pict_type != B_TYPE){
+        if(s->pict_type != B_TYPE && s->avctx->me_threshold==0){
              if((s->avctx->pre_me && s->last_non_b_pict_type==I_TYPE) || s->avctx->pre_me==2){
                  s->avctx->execute(s->avctx, pre_estimate_motion_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
              }
          }
  
          s->avctx->execute(s->avctx, estimate_motion_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
-        for(i=1; i<s->avctx->thread_count; i++){
-            merge_context_after_me(s, s->thread_context[i]);
-        }
      }else /* if(s->pict_type == I_TYPE) */{
          /* I-Frame */
          for(i=0; i<s->mb_stride*s->mb_height; i++)
@@ -4623,28 +4657,17 @@ static void encode_picture(MpegEncContext *s, int picture_number)
          
          if(!s->fixed_qscale){
              /* finding spatial complexity for I-frame rate control */
-            for(mb_y=0; mb_y < s->mb_height; mb_y++) {
-                for(mb_x=0; mb_x < s->mb_width; mb_x++) {
-                    int xx = mb_x * 16;
-                    int yy = mb_y * 16;
-                    uint8_t *pix = s->new_picture.data[0] + (yy * s->linesize) + xx;
-                    int varc;
-                   int sum = s->dsp.pix_sum(pix, s->linesize);
-    
-                   varc = (s->dsp.pix_norm1(pix, s->linesize) - (((unsigned)(sum*sum))>>8) + 500 + 128)>>8;
-
-                    s->current_picture.mb_var [s->mb_stride * mb_y + mb_x] = varc;
-                    s->current_picture.mb_mean[s->mb_stride * mb_y + mb_x] = (sum+128)>>8;
-                    s->mb_var_sum_temp    += varc;
-                }
-            }
+            s->avctx->execute(s->avctx, mb_var_thread, (void**)&(s->thread_context[0]), NULL, s->avctx->thread_count);
          }
      }
-    s->current_picture.mc_mb_var_sum= s->current_picture_ptr->mc_mb_var_sum= s->mc_mb_var_sum_temp;
-    s->current_picture.   mb_var_sum= s->current_picture_ptr->   mb_var_sum= s->   mb_var_sum_temp;
+    for(i=1; i<s->avctx->thread_count; i++){
+        merge_context_after_me(s, s->thread_context[i]);
+    }
+    s->current_picture.mc_mb_var_sum= s->current_picture_ptr->mc_mb_var_sum= s->me.mc_mb_var_sum_temp;
+    s->current_picture.   mb_var_sum= s->current_picture_ptr->   mb_var_sum= s->me.   mb_var_sum_temp;
      emms_c();
  
-    if(s->scene_change_score > s->avctx->scenechange_threshold && s->pict_type == P_TYPE){
+    if(s->me.scene_change_score > s->avctx->scenechange_threshold && s->pict_type == P_TYPE){
          s->pict_type= I_TYPE;
          for(i=0; i<s->mb_stride*s->mb_height; i++)
              s->mb_type[i]= CANDIDATE_MB_TYPE_INTRA;
@@ -4665,6 +4688,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
              ff_fix_long_p_mvs(s);
              ff_fix_long_mvs(s, NULL, 0, s->p_mv_table, s->f_code, CANDIDATE_MB_TYPE_INTER, 0);
              if(s->flags & CODEC_FLAG_INTERLACED_ME){
+                int j;
                  for(i=0; i<2; i++){
                      for(j=0; j<2; j++)
                          ff_fix_long_mvs(s, s->p_field_select_table[i], j, 
@@ -4689,7 +4713,7 @@ static void encode_picture(MpegEncContext *s, int picture_number)
              ff_fix_long_mvs(s, NULL, 0, s->b_bidir_forw_mv_table, s->f_code, CANDIDATE_MB_TYPE_BIDIR, 1);
              ff_fix_long_mvs(s, NULL, 0, s->b_bidir_back_mv_table, s->b_code, CANDIDATE_MB_TYPE_BIDIR, 1);
              if(s->flags & CODEC_FLAG_INTERLACED_ME){
-                int dir;
+                int dir, j;
                  for(dir=0; dir<2; dir++){
                      for(i=0; i<2; i++){
                          for(j=0; j<2; j++){
@@ -5145,7 +5169,6 @@ static int dct_quantize_refine(MpegEncContext *s, //FIXME breaks denoise?
      int prev_run=0;
      int prev_level=0;
      int qmul, qadd, start_i, last_non_zero, i, dc;
-    const int esc_length= s->ac_esc_length;
      uint8_t * length;
      uint8_t * last_length;
      int lambda;
@@ -5253,10 +5276,9 @@ STOP_TIMER("init rem[]")
  #endif
      for(;;){
          int best_score=s->dsp.try_8x8basis(rem, weight, basis[0], 0);
-        int nochange_score= best_score;
          int best_coeff=0;
          int best_change=0;
-        int run2, best_unquant_change, analyze_gradient;
+        int run2, best_unquant_change=0, analyze_gradient;
  #ifdef REFINE_STATS
  {START_TIMER
  #endif
@@ -5776,6 +5798,59 @@ static void dct_unquantize_h263_inter_c(MpegEncContext *s,
      }
  }
  
+/**
+ * H.261 inverse quantisation of an intra block, performed in place.
+ *
+ * block[0] is multiplied by y_dc_scale when n < 4 and by c_dc_scale otherwise.
+ * Every other non-zero coefficient, up to the index read from
+ * inter_scantable.raster_end[block_last_index[n]], is reconstructed as
+ *     qscale * (2*level + 1) - even    for level > 0
+ *     qscale * (2*level - 1) + even    for level < 0
+ * where even is 1 when qscale is even and 0 when it is odd, so every
+ * reconstructed non-zero value is odd.
+ *
+ * @param s      context supplying the DC scales, block_last_index and scantable
+ * @param block  coefficients, modified in place
+ * @param n      block index; block_last_index[n] must be >= 0
+ * @param qscale quantiser scale
+ */
+static void dct_unquantize_h261_intra_c(MpegEncContext *s, 
+                                  DCTELEM *block, int n, int qscale)
+{
+    int i, level, even;
+    int nCoeffs;
+    
+    assert(s->block_last_index[n]>=0);
+    
+    if (n < 4) 
+        block[0] = block[0] * s->y_dc_scale;
+    else
+        block[0] = block[0] * s->c_dc_scale;
+    even = (qscale & 1)^1;
+    nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];
+
+    /* the DC coefficient was handled above, so start at index 1 */
+    for(i=1; i<=nCoeffs; i++){
+        level = block[i];
+        if (level){
+            /* multiply instead of shifting: left-shifting a negative value is undefined in C */
+            if (level < 0){
+                level = qscale * (level * 2 - 1) + even;
+            }else{
+                level = qscale * (level * 2 + 1) - even;
+            }
+        }
+        block[i] = level;
+    }
+}
+
+/**
+ * H.261 inverse quantisation of an inter block, performed in place.
+ *
+ * Every non-zero coefficient from index 0 up to the index read from
+ * inter_scantable.raster_end[block_last_index[n]] is reconstructed as
+ *     qscale * (2*level + 1) - even    for level > 0
+ *     qscale * (2*level - 1) + even    for level < 0
+ * where even is 1 when qscale is even and 0 when it is odd, so every
+ * reconstructed non-zero value is odd. Zero coefficients stay zero.
+ *
+ * @param s      context supplying block_last_index and the scantable
+ * @param block  coefficients, modified in place
+ * @param n      block index; block_last_index[n] must be >= 0
+ * @param qscale quantiser scale
+ */
+static void dct_unquantize_h261_inter_c(MpegEncContext *s, 
+                                  DCTELEM *block, int n, int qscale)
+{
+    int i, level, even;
+    int nCoeffs;
+    
+    assert(s->block_last_index[n]>=0);
+
+    even = (qscale & 1)^1;
+    
+    nCoeffs= s->inter_scantable.raster_end[ s->block_last_index[n] ];
+
+    for(i=0; i<=nCoeffs; i++){
+        level = block[i];
+        if (level){
+            /* multiply instead of shifting: left-shifting a negative value is undefined in C */
+            if (level < 0){
+                level = qscale * (level * 2 - 1) + even;
+            }else{
+                level = qscale * (level * 2 + 1) - even;
+            }
+        }
+        block[i] = level;
+    }
+}
+
  static const AVOption mpeg4_options[] =
  {
      AVOPTION_CODEC_INT("bitrate", "desired video bitrate", bit_rate, 4, 240000000, 800000),