svq3: Prevent illegal reads while parsing extradata.

[ffmpeg] / avconv.c
diff --git a/avconv.c b/avconv.c

index f3e6e288baa99019f970790e3510595d923726bf..418e1fde8b770bd11e395587ba45c21fef7ffe56 100644 (file)
--- a/avconv.c
+++ b/avconv.c
@@ -76,6 +76,11 @@
  
  #include "libavutil/avassert.h"
  
+#define VSYNC_AUTO       -1
+#define VSYNC_PASSTHROUGH 0
+#define VSYNC_CFR         1
+#define VSYNC_VFR         2
+
  const char program_name[] = "avconv";
  const int program_birth_year = 2000;
  
@@ -111,7 +116,7 @@ static int do_hex_dump = 0;
  static int do_pkt_dump = 0;
  static int do_pass = 0;
  static char *pass_logfilename_prefix = NULL;
-static int video_sync_method = -1;
+static int video_sync_method = VSYNC_AUTO;
  static int audio_sync_method = 0;
  static float audio_drift_threshold = 0.1;
  static int copy_ts = 0;
@@ -136,8 +141,7 @@ static float dts_delta_threshold = 10;
  static int print_stats = 1;
  
  static uint8_t *audio_buf;
-static uint8_t *audio_out;
-static unsigned int allocated_audio_out_size, allocated_audio_buf_size;
+static unsigned int allocated_audio_buf_size;
  
  #define DEFAULT_PASS_LOGFILENAME_PREFIX "av2pass"
  
@@ -164,9 +168,11 @@ typedef struct InputStream {
      AVFrame *filtered_frame;
  
      int64_t       start;     /* time when read started */
-    int64_t       next_pts;  /* synthetic pts for cases where pkt.pts
-                                is not defined */
-    int64_t       pts;       /* current pts */
+    /* predicted dts of the next packet read for this stream or (when there are
+     * several frames in a packet) of the next frame in current packet */
+    int64_t       next_dts;
+    /* dts of the last packet read for this stream */
+    int64_t       last_dts;
      PtsCorrectionContext pts_ctx;
      double ts_scale;
      int is_start;            /* is 1 at the start and after a discontinuity */
@@ -200,9 +206,13 @@ typedef struct OutputStream {
      // double sync_ipts;        /* dts from the AVPacket of the demuxer in second units */
      struct InputStream *sync_ist; /* input stream to sync against */
      int64_t sync_opts;       /* output frame counter, could be changed to some true timestamp */ // FIXME look at frame_number
+    /* pts of the first frame encoded for this stream, used for limiting
+     * recording time */
+    int64_t first_pts;
      AVBitStreamFilterContext *bitstream_filters;
      AVCodec *enc;
      int64_t max_frames;
+    AVFrame *output_frame;
  
      /* video only */
      int video_resample;
@@ -416,7 +426,7 @@ static int alloc_buffer(InputStream *ist, FrameBuffer **pbuf)
  {
      AVCodecContext *s = ist->st->codec;
      FrameBuffer  *buf = av_mallocz(sizeof(*buf));
-    int ret;
+    int i, ret;
      const int pixel_size = av_pix_fmt_descriptors[s->pix_fmt].comp[0].step_minus1+1;
      int h_chroma_shift, v_chroma_shift;
      int edge = 32; // XXX should be avcodec_get_edge_width(), but that fails on svq1
@@ -444,7 +454,7 @@ static int alloc_buffer(InputStream *ist, FrameBuffer **pbuf)
      memset(buf->base[0], 128, ret);
  
      avcodec_get_chroma_sub_sample(s->pix_fmt, &h_chroma_shift, &v_chroma_shift);
-    for (int i = 0; i < FF_ARRAY_ELEMS(buf->data); i++) {
+    for (i = 0; i < FF_ARRAY_ELEMS(buf->data); i++) {
          const int h_shift = i==0 ? 0 : h_chroma_shift;
          const int v_shift = i==0 ? 0 : v_chroma_shift;
          if (s->flags & CODEC_FLAG_EMU_EDGE)
@@ -545,7 +555,7 @@ static int configure_video_filters(InputStream *ist, OutputStream *ost)
      /** filter graph containing all filters including input & output */
      AVCodecContext *codec = ost->st->codec;
      AVCodecContext *icodec = ist->st->codec;
-    FFSinkContext ffsink_ctx = { .pix_fmt = codec->pix_fmt };
+    SinkContext sink_ctx = { .pix_fmt = codec->pix_fmt };
      AVRational sample_aspect_ratio;
      char args[255];
      int ret;
@@ -565,8 +575,8 @@ static int configure_video_filters(InputStream *ist, OutputStream *ost)
                                         "src", args, NULL, ost->graph);
      if (ret < 0)
          return ret;
-    ret = avfilter_graph_create_filter(&ost->output_video_filter, &ffsink,
-                                       "out", NULL, &ffsink_ctx, ost->graph);
+    ret = avfilter_graph_create_filter(&ost->output_video_filter, &sink,
+                                       "out", NULL, &sink_ctx, ost->graph);
      if (ret < 0)
          return ret;
      last_filter = ost->input_video_filter;
@@ -603,7 +613,6 @@ static int configure_video_filters(InputStream *ist, OutputStream *ost)
  
          if ((ret = avfilter_graph_parse(ost->graph, ost->avfilter, inputs, outputs, NULL)) < 0)
              return ret;
-        av_freep(&ost->avfilter);
      } else {
          if ((ret = avfilter_link(last_filter, 0, ost->output_video_filter, 0)) < 0)
              return ret;
@@ -667,6 +676,26 @@ void exit_program(int ret)
          avformat_free_context(s);
          av_dict_free(&output_files[i].opts);
      }
+    for (i = 0; i < nb_output_streams; i++) {
+        AVBitStreamFilterContext *bsfc = output_streams[i].bitstream_filters;
+        while (bsfc) {
+            AVBitStreamFilterContext *next = bsfc->next;
+            av_bitstream_filter_close(bsfc);
+            bsfc = next;
+        }
+        output_streams[i].bitstream_filters = NULL;
+
+        if (output_streams[i].output_frame) {
+            AVFrame *frame = output_streams[i].output_frame;
+            if (frame->extended_data != frame->data)
+                av_freep(&frame->extended_data);
+            av_freep(&frame);
+        }
+
+#if CONFIG_AVFILTER
+        av_freep(&output_streams[i].avfilter);
+#endif
+    }
      for (i = 0; i < nb_input_files; i++) {
          avformat_close_input(&input_files[i].ctx);
      }
@@ -688,8 +717,7 @@ void exit_program(int ret)
  
      uninit_opts();
      av_free(audio_buf);
-    av_free(audio_out);
-    allocated_audio_buf_size = allocated_audio_out_size = 0;
+    allocated_audio_buf_size = 0;
  
  #if CONFIG_AVFILTER
      avfilter_uninit();
@@ -839,17 +867,31 @@ static void choose_pixel_fmt(AVStream *st, AVCodec *codec)
  }
  
  static double
-get_sync_ipts(const OutputStream *ost)
+get_sync_ipts(const OutputStream *ost, int64_t pts)
  {
-    const InputStream *ist = ost->sync_ist;
      OutputFile *of = &output_files[ost->file_index];
-    return (double)(ist->pts - of->start_time) / AV_TIME_BASE;
+    return (double)(pts - of->start_time) / AV_TIME_BASE;
  }
  
-static void write_frame(AVFormatContext *s, AVPacket *pkt, AVCodecContext *avctx, AVBitStreamFilterContext *bsfc)
+static void write_frame(AVFormatContext *s, AVPacket *pkt, OutputStream *ost)
  {
+    AVBitStreamFilterContext *bsfc = ost->bitstream_filters;
+    AVCodecContext          *avctx = ost->st->codec;
      int ret;
  
+    /*
+     * Audio encoders may split the packets --  #frames in != #packets out.
+     * But there is no reordering, so we can limit the number of output packets
+     * by simply dropping them here.
+     * Counting encoded video frames needs to be done separately because of
+     * reordering, see do_video_out()
+     */
+    if (!(avctx->codec_type == AVMEDIA_TYPE_VIDEO && avctx->codec)) {
+        if (ost->frame_number >= ost->max_frames)
+            return;
+        ost->frame_number++;
+    }
+
      while (bsfc) {
          AVPacket new_pkt = *pkt;
          int a = av_bitstream_filter_filter(bsfc, avctx, NULL,
@@ -872,6 +914,7 @@ static void write_frame(AVFormatContext *s, AVPacket *pkt, AVCodecContext *avctx
          bsfc = bsfc->next;
      }
  
+    pkt->stream_index = ost->index;
      ret = av_interleaved_write_frame(s, pkt);
      if (ret < 0) {
          print_error("av_interleaved_write_frame()", ret);
@@ -879,6 +922,19 @@ static void write_frame(AVFormatContext *s, AVPacket *pkt, AVCodecContext *avctx
      }
  }
  
+static int check_recording_time(OutputStream *ost)
+{
+    OutputFile *of = &output_files[ost->file_index];
+
+    if (of->recording_time != INT64_MAX &&
+        av_compare_ts(ost->sync_opts - ost->first_pts, ost->st->codec->time_base, of->recording_time,
+                      AV_TIME_BASE_Q) >= 0) {
+        ost->is_past_recording_time = 1;
+        return 0;
+    }
+    return 1;
+}
+
  static void generate_silence(uint8_t* buf, enum AVSampleFormat sample_fmt, size_t size)
  {
      int fill_char = 0x00;
@@ -887,18 +943,78 @@ static void generate_silence(uint8_t* buf, enum AVSampleFormat sample_fmt, size_
      memset(buf, fill_char, size);
  }
  
+static int encode_audio_frame(AVFormatContext *s, OutputStream *ost,
+                              const uint8_t *buf, int buf_size)
+{
+    AVCodecContext *enc = ost->st->codec;
+    AVFrame *frame = NULL;
+    AVPacket pkt;
+    int ret, got_packet;
+
+    av_init_packet(&pkt);
+    pkt.data = NULL;
+    pkt.size = 0;
+
+    if (buf) {
+        if (!ost->output_frame) {
+            ost->output_frame = avcodec_alloc_frame();
+            if (!ost->output_frame) {
+                av_log(NULL, AV_LOG_FATAL, "out-of-memory in encode_audio_frame()\n");
+                exit_program(1);
+            }
+        }
+        frame = ost->output_frame;
+        if (frame->extended_data != frame->data)
+            av_freep(&frame->extended_data);
+        avcodec_get_frame_defaults(frame);
+
+        frame->nb_samples  = buf_size /
+                             (enc->channels * av_get_bytes_per_sample(enc->sample_fmt));
+        if ((ret = avcodec_fill_audio_frame(frame, enc->channels, enc->sample_fmt,
+                                            buf, buf_size, 1)) < 0) {
+            av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
+            exit_program(1);
+        }
+
+        if (!check_recording_time(ost))
+            return 0;
+
+        ost->sync_opts += frame->nb_samples;
+    }
+
+    got_packet = 0;
+    if (avcodec_encode_audio2(enc, &pkt, frame, &got_packet) < 0) {
+        av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
+        exit_program(1);
+    }
+
+    if (got_packet) {
+        if (pkt.pts != AV_NOPTS_VALUE)
+            pkt.pts      = av_rescale_q(pkt.pts,      enc->time_base, ost->st->time_base);
+        if (pkt.dts != AV_NOPTS_VALUE)
+            pkt.dts      = av_rescale_q(pkt.dts,      enc->time_base, ost->st->time_base);
+        if (pkt.duration > 0)
+            pkt.duration = av_rescale_q(pkt.duration, enc->time_base, ost->st->time_base);
+
+        write_frame(s, &pkt, ost);
+
+        audio_size += pkt.size;
+    }
+
+    return pkt.size;
+}
+
  static void do_audio_out(AVFormatContext *s, OutputStream *ost,
                           InputStream *ist, AVFrame *decoded_frame)
  {
      uint8_t *buftmp;
-    int64_t audio_out_size, audio_buf_size;
+    int64_t audio_buf_size;
  
-    int size_out, frame_bytes, ret, resample_changed;
+    int size_out, frame_bytes, resample_changed;
      AVCodecContext *enc = ost->st->codec;
      AVCodecContext *dec = ist->st->codec;
      int osize = av_get_bytes_per_sample(enc->sample_fmt);
      int isize = av_get_bytes_per_sample(dec->sample_fmt);
-    const int coded_bps = av_get_bits_per_sample(enc->codec->id);
      uint8_t *buf = decoded_frame->data[0];
      int size     = decoded_frame->nb_samples * dec->channels * isize;
      int64_t allocated_for_size = size;
@@ -910,19 +1026,13 @@ need_realloc:
      audio_buf_size  = FFMAX(audio_buf_size, enc->frame_size);
      audio_buf_size *= osize * enc->channels;
  
-    audio_out_size = FFMAX(audio_buf_size, enc->frame_size * osize * enc->channels);
-    if (coded_bps > 8 * osize)
-        audio_out_size = audio_out_size * coded_bps / (8*osize);
-    audio_out_size += FF_MIN_BUFFER_SIZE;
-
-    if (audio_out_size > INT_MAX || audio_buf_size > INT_MAX) {
+    if (audio_buf_size > INT_MAX) {
          av_log(NULL, AV_LOG_FATAL, "Buffer sizes too large\n");
          exit_program(1);
      }
  
      av_fast_malloc(&audio_buf, &allocated_audio_buf_size, audio_buf_size);
-    av_fast_malloc(&audio_out, &allocated_audio_out_size, audio_out_size);
-    if (!audio_buf || !audio_out) {
+    if (!audio_buf) {
          av_log(NULL, AV_LOG_FATAL, "Out of memory in do_audio_out\n");
          exit_program(1);
      }
@@ -986,7 +1096,7 @@ need_realloc:
      }
  
      if (audio_sync_method) {
-        double delta = get_sync_ipts(ost) * enc->sample_rate - ost->sync_opts -
+        double delta = get_sync_ipts(ost, ist->last_dts) * enc->sample_rate - ost->sync_opts -
                         av_fifo_size(ost->fifo) / (enc->channels * osize);
          int idelta = delta * dec->sample_rate / enc->sample_rate;
          int byte_delta = idelta * isize * dec->channels;
@@ -1029,7 +1139,7 @@ need_realloc:
              }
          }
      } else
-        ost->sync_opts = lrintf(get_sync_ipts(ost) * enc->sample_rate) -
+        ost->sync_opts = lrintf(get_sync_ipts(ost, ist->last_dts) * enc->sample_rate) -
                                  av_fifo_size(ost->fifo) / (enc->channels * osize); // FIXME wrong
  
      if (ost->audio_resample) {
@@ -1060,7 +1170,7 @@ need_realloc:
      }
  
      /* now encode as many frames as possible */
-    if (enc->frame_size > 1) {
+    if (!(enc->codec->capabilities & CODEC_CAP_VARIABLE_FRAME_SIZE)) {
          /* output resampled raw samples */
          if (av_fifo_realloc2(ost->fifo, av_fifo_size(ost->fifo) + size_out) < 0) {
              av_log(NULL, AV_LOG_FATAL, "av_fifo_realloc2() failed\n");
@@ -1071,62 +1181,11 @@ need_realloc:
          frame_bytes = enc->frame_size * osize * enc->channels;
  
          while (av_fifo_size(ost->fifo) >= frame_bytes) {
-            AVPacket pkt;
-            av_init_packet(&pkt);
-
              av_fifo_generic_read(ost->fifo, audio_buf, frame_bytes, NULL);
-
-            // FIXME pass ost->sync_opts as AVFrame.pts in avcodec_encode_audio()
-
-            ret = avcodec_encode_audio(enc, audio_out, audio_out_size,
-                                       (short *)audio_buf);
-            if (ret < 0) {
-                av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
-                exit_program(1);
-            }
-            audio_size += ret;
-            pkt.stream_index = ost->index;
-            pkt.data = audio_out;
-            pkt.size = ret;
-            if (enc->coded_frame && enc->coded_frame->pts != AV_NOPTS_VALUE)
-                pkt.pts = av_rescale_q(enc->coded_frame->pts, enc->time_base, ost->st->time_base);
-            pkt.flags |= AV_PKT_FLAG_KEY;
-            write_frame(s, &pkt, enc, ost->bitstream_filters);
-
-            ost->sync_opts += enc->frame_size;
+            encode_audio_frame(s, ost, audio_buf, frame_bytes);
          }
      } else {
-        AVPacket pkt;
-        av_init_packet(&pkt);
-
-        ost->sync_opts += size_out / (osize * enc->channels);
-
-        /* output a pcm frame */
-        /* determine the size of the coded buffer */
-        size_out /= osize;
-        if (coded_bps)
-            size_out = size_out * coded_bps / 8;
-
-        if (size_out > audio_out_size) {
-            av_log(NULL, AV_LOG_FATAL, "Internal error, buffer size too small\n");
-            exit_program(1);
-        }
-
-        // FIXME pass ost->sync_opts as AVFrame.pts in avcodec_encode_audio()
-        ret = avcodec_encode_audio(enc, audio_out, size_out,
-                                   (short *)buftmp);
-        if (ret < 0) {
-            av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
-            exit_program(1);
-        }
-        audio_size += ret;
-        pkt.stream_index = ost->index;
-        pkt.data = audio_out;
-        pkt.size = ret;
-        if (enc->coded_frame && enc->coded_frame->pts != AV_NOPTS_VALUE)
-            pkt.pts = av_rescale_q(enc->coded_frame->pts, enc->time_base, ost->st->time_base);
-        pkt.flags |= AV_PKT_FLAG_KEY;
-        write_frame(s, &pkt, enc, ost->bitstream_filters);
+        encode_audio_frame(s, ost, buftmp, size_out);
      }
  }
  
@@ -1203,6 +1262,10 @@ static void do_subtitle_out(AVFormatContext *s,
          nb = 1;
  
      for (i = 0; i < nb; i++) {
+        ost->sync_opts = av_rescale_q(pts, ist->st->time_base, enc->time_base);
+        if (!check_recording_time(ost))
+            return;
+
          sub->pts = av_rescale_q(pts, ist->st->time_base, AV_TIME_BASE_Q);
          // start_display_time is required to be 0
          sub->pts               += av_rescale_q(sub->start_display_time, (AVRational){ 1, 1000 }, AV_TIME_BASE_Q);
@@ -1216,7 +1279,6 @@ static void do_subtitle_out(AVFormatContext *s,
          }
  
          av_init_packet(&pkt);
-        pkt.stream_index = ost->index;
          pkt.data = subtitle_out;
          pkt.size = subtitle_out_size;
          pkt.pts  = av_rescale_q(sub->pts, AV_TIME_BASE_Q, ost->st->time_base);
@@ -1228,37 +1290,33 @@ static void do_subtitle_out(AVFormatContext *s,
              else
                  pkt.pts += 90 * sub->end_display_time;
          }
-        write_frame(s, &pkt, ost->st->codec, ost->bitstream_filters);
+        write_frame(s, &pkt, ost);
      }
  }
  
-static int bit_buffer_size = 1024 * 256;
-static uint8_t *bit_buffer = NULL;
-
+#if !CONFIG_AVFILTER
  static void do_video_resample(OutputStream *ost,
                                InputStream *ist,
                                AVFrame *in_picture,
                                AVFrame **out_picture)
  {
      int resample_changed = 0;
-    AVCodecContext *dec = ist->st->codec;
      *out_picture = in_picture;
  
-    resample_changed = ost->resample_width   != dec->width  ||
-                       ost->resample_height  != dec->height ||
-                       ost->resample_pix_fmt != dec->pix_fmt;
+    resample_changed = ost->resample_width   != in_picture->width  ||
+                       ost->resample_height  != in_picture->height ||
+                       ost->resample_pix_fmt != in_picture->format;
  
      if (resample_changed) {
          av_log(NULL, AV_LOG_INFO,
                 "Input stream #%d:%d frame changed from size:%dx%d fmt:%s to size:%dx%d fmt:%s\n",
                 ist->file_index, ist->st->index,
                 ost->resample_width, ost->resample_height, av_get_pix_fmt_name(ost->resample_pix_fmt),
-               dec->width         , dec->height         , av_get_pix_fmt_name(dec->pix_fmt));
+               in_picture->width, in_picture->height, av_get_pix_fmt_name(in_picture->format));
          if (!ost->video_resample)
              ost->video_resample = 1;
      }
  
-#if !CONFIG_AVFILTER
      if (ost->video_resample) {
          *out_picture = &ost->pict_tmp;
          if (resample_changed) {
@@ -1280,21 +1338,13 @@ static void do_video_resample(OutputStream *ost,
          sws_scale(ost->img_resample_ctx, in_picture->data, in_picture->linesize,
                0, ost->resample_height, (*out_picture)->data, (*out_picture)->linesize);
      }
-#else
      if (resample_changed) {
-        avfilter_graph_free(&ost->graph);
-        if (configure_video_filters(ist, ost)) {
-            av_log(NULL, AV_LOG_FATAL, "Error reinitializing filters!\n");
-            exit_program(1);
-        }
-    }
-#endif
-    if (resample_changed) {
-        ost->resample_width   = dec->width;
-        ost->resample_height  = dec->height;
-        ost->resample_pix_fmt = dec->pix_fmt;
+        ost->resample_width   = in_picture->width;
+        ost->resample_height  = in_picture->height;
+        ost->resample_pix_fmt = in_picture->format;
      }
  }
+#endif
  
  
  static void do_video_out(AVFormatContext *s,
@@ -1310,7 +1360,7 @@ static void do_video_out(AVFormatContext *s,
  
      enc = ost->st->codec;
  
-    sync_ipts = get_sync_ipts(ost) / av_q2d(enc->time_base);
+    sync_ipts = get_sync_ipts(ost, in_picture->pts) / av_q2d(enc->time_base);
  
      /* by default, we output a single frame */
      nb_frames = 1;
@@ -1318,23 +1368,22 @@ static void do_video_out(AVFormatContext *s,
      *frame_size = 0;
  
      format_video_sync = video_sync_method;
-    if (format_video_sync < 0)
-        format_video_sync = (s->oformat->flags & AVFMT_NOTIMESTAMPS) ? 0 :
-                            (s->oformat->flags & AVFMT_VARIABLE_FPS) ? 2 : 1;
+    if (format_video_sync == VSYNC_AUTO)
+        format_video_sync = (s->oformat->flags & AVFMT_NOTIMESTAMPS) ? VSYNC_PASSTHROUGH :
+                            (s->oformat->flags & AVFMT_VARIABLE_FPS) ? VSYNC_VFR : VSYNC_CFR;
  
-    if (format_video_sync) {
+    if (format_video_sync != VSYNC_PASSTHROUGH) {
          double vdelta = sync_ipts - ost->sync_opts;
          // FIXME set to 0.5 after we fix some dts/pts bugs like in avidec.c
          if (vdelta < -1.1)
              nb_frames = 0;
-        else if (format_video_sync == 2) {
+        else if (format_video_sync == VSYNC_VFR) {
              if (vdelta <= -0.6) {
                  nb_frames = 0;
              } else if (vdelta > 0.6)
                  ost->sync_opts = lrintf(sync_ipts);
          } else if (vdelta > 1.1)
              nb_frames = lrintf(vdelta);
-//fprintf(stderr, "vdelta:%f, ost->sync_opts:%"PRId64", ost->sync_ipts:%f nb_frames:%d\n", vdelta, ost->sync_opts, get_sync_ipts(ost), nb_frames);
          if (nb_frames == 0) {
              ++nb_frames_drop;
              av_log(NULL, AV_LOG_VERBOSE, "*** drop!\n");
@@ -1349,13 +1398,24 @@ static void do_video_out(AVFormatContext *s,
      if (nb_frames <= 0)
          return;
  
+#if !CONFIG_AVFILTER
      do_video_resample(ost, ist, in_picture, &final_picture);
+#else
+    final_picture = in_picture;
+#endif
+
+    if (!ost->frame_number)
+        ost->first_pts = ost->sync_opts;
  
      /* duplicates frame if needed */
      for (i = 0; i < nb_frames; i++) {
          AVPacket pkt;
          av_init_packet(&pkt);
-        pkt.stream_index = ost->index;
+        pkt.data = NULL;
+        pkt.size = 0;
+
+        if (!check_recording_time(ost))
+            return;
  
          if (s->oformat->flags & AVFMT_RAWPICTURE &&
              enc->codec->id == CODEC_ID_RAWVIDEO) {
@@ -1369,8 +1429,9 @@ static void do_video_out(AVFormatContext *s,
              pkt.pts    = av_rescale_q(ost->sync_opts, enc->time_base, ost->st->time_base);
              pkt.flags |= AV_PKT_FLAG_KEY;
  
-            write_frame(s, &pkt, ost->st->codec, ost->bitstream_filters);
+            write_frame(s, &pkt, ost);
          } else {
+            int got_packet;
              AVFrame big_picture;
  
              big_picture = *final_picture;
@@ -1389,39 +1450,28 @@ static void do_video_out(AVFormatContext *s,
              big_picture.quality = quality;
              if (!enc->me_threshold)
                  big_picture.pict_type = 0;
-//            big_picture.pts = AV_NOPTS_VALUE;
              big_picture.pts = ost->sync_opts;
-//            big_picture.pts= av_rescale(ost->sync_opts, AV_TIME_BASE*(int64_t)enc->time_base.num, enc->time_base.den);
-// av_log(NULL, AV_LOG_DEBUG, "%"PRId64" -> encoder\n", ost->sync_opts);
              if (ost->forced_kf_index < ost->forced_kf_count &&
                  big_picture.pts >= ost->forced_kf_pts[ost->forced_kf_index]) {
                  big_picture.pict_type = AV_PICTURE_TYPE_I;
                  ost->forced_kf_index++;
              }
-            ret = avcodec_encode_video(enc,
-                                       bit_buffer, bit_buffer_size,
-                                       &big_picture);
+            ret = avcodec_encode_video2(enc, &pkt, &big_picture, &got_packet);
              if (ret < 0) {
                  av_log(NULL, AV_LOG_FATAL, "Video encoding failed\n");
                  exit_program(1);
              }
  
-            if (ret > 0) {
-                pkt.data = bit_buffer;
-                pkt.size = ret;
-                if (enc->coded_frame->pts != AV_NOPTS_VALUE)
-                    pkt.pts = av_rescale_q(enc->coded_frame->pts, enc->time_base, ost->st->time_base);
-/*av_log(NULL, AV_LOG_DEBUG, "encoder -> %"PRId64"/%"PRId64"\n",
-   pkt.pts != AV_NOPTS_VALUE ? av_rescale(pkt.pts, enc->time_base.den, AV_TIME_BASE*(int64_t)enc->time_base.num) : -1,
-   pkt.dts != AV_NOPTS_VALUE ? av_rescale(pkt.dts, enc->time_base.den, AV_TIME_BASE*(int64_t)enc->time_base.num) : -1);*/
-
-                if (enc->coded_frame->key_frame)
-                    pkt.flags |= AV_PKT_FLAG_KEY;
-                write_frame(s, &pkt, ost->st->codec, ost->bitstream_filters);
+            if (got_packet) {
+                if (pkt.pts != AV_NOPTS_VALUE)
+                    pkt.pts = av_rescale_q(pkt.pts, enc->time_base, ost->st->time_base);
+                if (pkt.dts != AV_NOPTS_VALUE)
+                    pkt.dts = av_rescale_q(pkt.dts, enc->time_base, ost->st->time_base);
+
+                write_frame(s, &pkt, ost);
                  *frame_size = ret;
                  video_size += ret;
-                // fprintf(stderr,"\nFrame: %3d size: %5d type: %d",
-                //         enc->frame_number-1, ret, enc->pict_type);
+
                  /* if two pass, output log */
                  if (ost->logfile && enc->stats_out) {
                      fprintf(ost->logfile, "%s", enc->stats_out);
@@ -1429,6 +1479,11 @@ static void do_video_out(AVFormatContext *s,
              }
          }
          ost->sync_opts++;
+        /*
+         * For video, number of frames in == number of packets out.
+         * But there may be reordering, so we can't throw away frames on encoder
+         * flush, we need to limit them here, before they go into encoder.
+         */
          ost->frame_number++;
      }
  }
@@ -1606,6 +1661,7 @@ static void flush_encoders(OutputStream *ost_table, int nb_ostreams)
          OutputStream   *ost = &ost_table[i];
          AVCodecContext *enc = ost->st->codec;
          AVFormatContext *os = output_files[ost->file_index].ctx;
+        int stop_encoding = 0;
  
          if (!ost->encoding_needed)
              continue;
@@ -1617,68 +1673,63 @@ static void flush_encoders(OutputStream *ost_table, int nb_ostreams)
  
          for (;;) {
              AVPacket pkt;
-            int fifo_bytes;
+            int fifo_bytes, got_packet;
              av_init_packet(&pkt);
-            pkt.stream_index = ost->index;
+            pkt.data = NULL;
+            pkt.size = 0;
  
              switch (ost->st->codec->codec_type) {
              case AVMEDIA_TYPE_AUDIO:
                  fifo_bytes = av_fifo_size(ost->fifo);
-                ret = 0;
-                /* encode any samples remaining in fifo */
                  if (fifo_bytes > 0) {
-                    int osize = av_get_bytes_per_sample(enc->sample_fmt);
-                    int fs_tmp = enc->frame_size;
+                    /* encode any samples remaining in fifo */
+                    int frame_bytes = fifo_bytes;
  
                      av_fifo_generic_read(ost->fifo, audio_buf, fifo_bytes, NULL);
-                    if (enc->codec->capabilities & CODEC_CAP_SMALL_LAST_FRAME) {
-                        enc->frame_size = fifo_bytes / (osize * enc->channels);
-                    } else { /* pad */
-                        int frame_bytes = enc->frame_size*osize*enc->channels;
+
+                    /* pad last frame with silence if needed */
+                    if (!(enc->codec->capabilities & CODEC_CAP_SMALL_LAST_FRAME)) {
+                        frame_bytes = enc->frame_size * enc->channels *
+                                      av_get_bytes_per_sample(enc->sample_fmt);
                          if (allocated_audio_buf_size < frame_bytes)
                              exit_program(1);
                          generate_silence(audio_buf+fifo_bytes, enc->sample_fmt, frame_bytes - fifo_bytes);
                      }
-
-                    ret = avcodec_encode_audio(enc, bit_buffer, bit_buffer_size, (short *)audio_buf);
-                    pkt.duration = av_rescale((int64_t)enc->frame_size*ost->st->time_base.den,
-                                              ost->st->time_base.num, enc->sample_rate);
-                    enc->frame_size = fs_tmp;
-                }
-                if (ret <= 0) {
-                    ret = avcodec_encode_audio(enc, bit_buffer, bit_buffer_size, NULL);
-                }
-                if (ret < 0) {
-                    av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
-                    exit_program(1);
+                    encode_audio_frame(os, ost, audio_buf, frame_bytes);
+                } else {
+                    /* flush encoder with NULL frames until it is done
+                       returning packets */
+                    if (encode_audio_frame(os, ost, NULL, 0) == 0) {
+                        stop_encoding = 1;
+                        break;
+                    }
                  }
-                audio_size += ret;
-                pkt.flags  |= AV_PKT_FLAG_KEY;
                  break;
              case AVMEDIA_TYPE_VIDEO:
-                ret = avcodec_encode_video(enc, bit_buffer, bit_buffer_size, NULL);
+                ret = avcodec_encode_video2(enc, &pkt, NULL, &got_packet);
                  if (ret < 0) {
                      av_log(NULL, AV_LOG_FATAL, "Video encoding failed\n");
                      exit_program(1);
                  }
                  video_size += ret;
-                if (enc->coded_frame && enc->coded_frame->key_frame)
-                    pkt.flags |= AV_PKT_FLAG_KEY;
                  if (ost->logfile && enc->stats_out) {
                      fprintf(ost->logfile, "%s", enc->stats_out);
                  }
+                if (!got_packet) {
+                    stop_encoding = 1;
+                    break;
+                }
+                if (pkt.pts != AV_NOPTS_VALUE)
+                    pkt.pts = av_rescale_q(pkt.pts, enc->time_base, ost->st->time_base);
+                if (pkt.dts != AV_NOPTS_VALUE)
+                    pkt.dts = av_rescale_q(pkt.dts, enc->time_base, ost->st->time_base);
+                write_frame(os, &pkt, ost);
                  break;
              default:
-                ret = -1;
+                stop_encoding = 1;
              }
-
-            if (ret <= 0)
+            if (stop_encoding)
                  break;
-            pkt.data = bit_buffer;
-            pkt.size = ret;
-            if (enc->coded_frame && enc->coded_frame->pts != AV_NOPTS_VALUE)
-                pkt.pts = av_rescale_q(enc->coded_frame->pts, enc->time_base, ost->st->time_base);
-            write_frame(os, &pkt, ost->st->codec, ost->bitstream_filters);
          }
      }
  }
@@ -1694,16 +1745,9 @@ static int check_output_constraints(InputStream *ist, OutputStream *ost)
      if (ost->source_index != ist_index)
          return 0;
  
-    if (of->start_time && ist->pts < of->start_time)
+    if (of->start_time && ist->last_dts < of->start_time)
          return 0;
  
-    if (of->recording_time != INT64_MAX &&
-        av_compare_ts(ist->pts, AV_TIME_BASE_Q, of->recording_time + of->start_time,
-                      (AVRational){ 1, 1000000 }) >= 0) {
-        ost->is_past_recording_time = 1;
-        return 0;
-    }
-
      return 1;
  }
  
@@ -1719,6 +1763,12 @@ static void do_streamcopy(InputStream *ist, OutputStream *ost, const AVPacket *p
          !ost->copy_initial_nonkeyframes)
          return;
  
+    if (of->recording_time != INT64_MAX &&
+        ist->last_dts >= of->recording_time + of->start_time) {
+        ost->is_past_recording_time = 1;
+        return;
+    }
+
      /* force the input stream PTS */
      if (ost->st->codec->codec_type == AVMEDIA_TYPE_AUDIO)
          audio_size += pkt->size;
@@ -1727,14 +1777,13 @@ static void do_streamcopy(InputStream *ist, OutputStream *ost, const AVPacket *p
          ost->sync_opts++;
      }
  
-    opkt.stream_index = ost->index;
      if (pkt->pts != AV_NOPTS_VALUE)
          opkt.pts = av_rescale_q(pkt->pts, ist->st->time_base, ost->st->time_base) - ost_tb_start_time;
      else
          opkt.pts = AV_NOPTS_VALUE;
  
      if (pkt->dts == AV_NOPTS_VALUE)
-        opkt.dts = av_rescale_q(ist->pts, AV_TIME_BASE_Q, ost->st->time_base);
+        opkt.dts = av_rescale_q(ist->last_dts, AV_TIME_BASE_Q, ost->st->time_base);
      else
          opkt.dts = av_rescale_q(pkt->dts, ist->st->time_base, ost->st->time_base);
      opkt.dts -= ost_tb_start_time;
@@ -1754,16 +1803,15 @@ static void do_streamcopy(InputStream *ist, OutputStream *ost, const AVPacket *p
          opkt.size = pkt->size;
      }
  
-    write_frame(of->ctx, &opkt, ost->st->codec, ost->bitstream_filters);
+    write_frame(of->ctx, &opkt, ost);
      ost->st->codec->frame_number++;
-    ost->frame_number++;
      av_free_packet(&opkt);
  }
  
  static void rate_emu_sleep(InputStream *ist)
  {
      if (input_files[ist->file_index].rate_emu) {
-        int64_t pts = av_rescale(ist->pts, 1000000, AV_TIME_BASE);
+        int64_t pts = av_rescale(ist->last_dts, 1000000, AV_TIME_BASE);
          int64_t now = av_gettime() - ist->start;
          if (pts > now)
              usleep(pts - now);
@@ -1796,11 +1844,11 @@ static int transcode_audio(InputStream *ist, AVPacket *pkt, int *got_output)
      /* if the decoder provides a pts, use it instead of the last packet pts.
         the decoder could be delaying output by a packet or more. */
      if (decoded_frame->pts != AV_NOPTS_VALUE)
-        ist->next_pts = decoded_frame->pts;
+        ist->next_dts = decoded_frame->pts;
  
-    /* increment next_pts to use for the case where the input stream does not
+    /* increment next_dts to use for the case where the input stream does not
         have timestamps or there are multiple frames in the packet */
-    ist->next_pts += ((int64_t)AV_TIME_BASE * decoded_frame->nb_samples) /
+    ist->next_dts += ((int64_t)AV_TIME_BASE * decoded_frame->nb_samples) /
                       avctx->sample_rate;
  
      // preprocess audio (volume)
@@ -1890,7 +1938,7 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
          avcodec_get_frame_defaults(ist->decoded_frame);
      decoded_frame = ist->decoded_frame;
      pkt->pts  = *pkt_pts;
-    pkt->dts  = ist->pts;
+    pkt->dts  = ist->last_dts;
      *pkt_pts  = AV_NOPTS_VALUE;
  
      ret = avcodec_decode_video2(ist->st->codec,
@@ -1903,17 +1951,8 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
          /* no picture yet */
          return ret;
      }
-    ist->next_pts = ist->pts = guess_correct_pts(&ist->pts_ctx, decoded_frame->pkt_pts,
-                                                 decoded_frame->pkt_dts);
-    if (pkt->duration)
-        ist->next_pts += av_rescale_q(pkt->duration, ist->st->time_base, AV_TIME_BASE_Q);
-    else if (ist->st->codec->time_base.num != 0) {
-        int ticks      = ist->st->parser ? ist->st->parser->repeat_pict + 1 :
-                                           ist->st->codec->ticks_per_frame;
-        ist->next_pts += ((int64_t)AV_TIME_BASE *
-                          ist->st->codec->time_base.num * ticks) /
-                          ist->st->codec->time_base.den;
-    }
+    decoded_frame->pts = guess_correct_pts(&ist->pts_ctx, decoded_frame->pkt_pts,
+                                           decoded_frame->pkt_dts);
      pkt->size = 0;
      pre_process_video_frame(ist, (AVPicture *)decoded_frame, &buffer_to_free);
  
@@ -1921,12 +1960,33 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
  
      for (i = 0; i < nb_output_streams; i++) {
          OutputStream *ost = &output_streams[i];
-        int frame_size;
+        int frame_size, resample_changed;
  
          if (!check_output_constraints(ist, ost) || !ost->encoding_needed)
              continue;
  
  #if CONFIG_AVFILTER
+        resample_changed = ost->resample_width   != decoded_frame->width  ||
+                           ost->resample_height  != decoded_frame->height ||
+                           ost->resample_pix_fmt != decoded_frame->format;
+        if (resample_changed) {
+            av_log(NULL, AV_LOG_INFO,
+                    "Input stream #%d:%d frame changed from size:%dx%d fmt:%s to size:%dx%d fmt:%s\n",
+                    ist->file_index, ist->st->index,
+                    ost->resample_width,  ost->resample_height,  av_get_pix_fmt_name(ost->resample_pix_fmt),
+                    decoded_frame->width, decoded_frame->height, av_get_pix_fmt_name(decoded_frame->format));
+
+            avfilter_graph_free(&ost->graph);
+            if (configure_video_filters(ist, ost)) {
+                av_log(NULL, AV_LOG_FATAL, "Error reinitializing filters!\n");
+                exit_program(1);
+            }
+
+            ost->resample_width   = decoded_frame->width;
+            ost->resample_height  = decoded_frame->height;
+            ost->resample_pix_fmt = decoded_frame->format;
+        }
+
          if (ist->st->sample_aspect_ratio.num)
              decoded_frame->sample_aspect_ratio = ist->st->sample_aspect_ratio;
          if (ist->st->codec->codec->capabilities & CODEC_CAP_DR1) {
@@ -1938,7 +1998,6 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
                                          ist->st->codec->pix_fmt);
  
              avfilter_copy_frame_props(fb, decoded_frame);
-            fb->pts                 = ist->pts;
              fb->buf->priv           = buf;
              fb->buf->free           = filter_release_buffer;
  
@@ -1946,7 +2005,7 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
              av_buffersrc_buffer(ost->input_video_filter, fb);
          } else
              av_vsrc_buffer_add_frame(ost->input_video_filter, decoded_frame,
-                                     ist->pts, decoded_frame->sample_aspect_ratio);
+                                     decoded_frame->pts, decoded_frame->sample_aspect_ratio);
  
          if (!ist->filtered_frame && !(ist->filtered_frame = avcodec_alloc_frame())) {
              av_free(buffer_to_free);
@@ -1961,7 +2020,7 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
              if (ost->output_video_filter)
                  get_filtered_video_frame(ost->output_video_filter, filtered_frame, &ost->picref, &ist_pts_tb);
              if (ost->picref)
-                ist->pts = av_rescale_q(ost->picref->pts, ist_pts_tb, AV_TIME_BASE_Q);
+                filtered_frame->pts = av_rescale_q(ost->picref->pts, ist_pts_tb, AV_TIME_BASE_Q);
              if (ost->picref->video && !ost->frame_aspect_ratio)
                  ost->st->codec->sample_aspect_ratio = ost->picref->video->pixel_aspect;
  #else
@@ -2019,8 +2078,8 @@ static int output_packet(InputStream *ist,
      int64_t pkt_pts = AV_NOPTS_VALUE;
      AVPacket avpkt;
  
-    if (ist->next_pts == AV_NOPTS_VALUE)
-        ist->next_pts = ist->pts;
+    if (ist->next_dts == AV_NOPTS_VALUE)
+        ist->next_dts = ist->last_dts;
  
      if (pkt == NULL) {
          /* EOF handling */
@@ -2033,7 +2092,7 @@ static int output_packet(InputStream *ist,
      }
  
      if (pkt->dts != AV_NOPTS_VALUE)
-        ist->next_pts = ist->pts = av_rescale_q(pkt->dts, ist->st->time_base, AV_TIME_BASE_Q);
+        ist->next_dts = ist->last_dts = av_rescale_q(pkt->dts, ist->st->time_base, AV_TIME_BASE_Q);
      if (pkt->pts != AV_NOPTS_VALUE)
          pkt_pts = av_rescale_q(pkt->pts, ist->st->time_base, AV_TIME_BASE_Q);
  
@@ -2042,7 +2101,7 @@ static int output_packet(InputStream *ist,
          int ret = 0;
      handle_eof:
  
-        ist->pts = ist->next_pts;
+        ist->last_dts = ist->next_dts;
  
          if (avpkt.size && avpkt.size != pkt->size) {
              av_log(NULL, ist->showed_multi_packet_warning ? AV_LOG_VERBOSE : AV_LOG_WARNING,
@@ -2056,6 +2115,17 @@ static int output_packet(InputStream *ist,
              break;
          case AVMEDIA_TYPE_VIDEO:
              ret = transcode_video    (ist, &avpkt, &got_output, &pkt_pts);
+            if (avpkt.duration)
+                ist->next_dts += av_rescale_q(avpkt.duration, ist->st->time_base, AV_TIME_BASE_Q);
+            else if (ist->st->r_frame_rate.num)
+                ist->next_dts += av_rescale_q(1, (AVRational){ist->st->r_frame_rate.den,
+                                                              ist->st->r_frame_rate.num},
+                                              AV_TIME_BASE_Q);
+            else if (ist->st->codec->time_base.num != 0) {
+                int ticks      = ist->st->parser ? ist->st->parser->repeat_pict + 1 :
+                                                   ist->st->codec->ticks_per_frame;
+                ist->next_dts += av_rescale_q(ticks, ist->st->codec->time_base, AV_TIME_BASE_Q);
+            }
              break;
          case AVMEDIA_TYPE_SUBTITLE:
              ret = transcode_subtitles(ist, &avpkt, &got_output);
@@ -2079,16 +2149,16 @@ static int output_packet(InputStream *ist,
      /* handle stream copy */
      if (!ist->decoding_needed) {
          rate_emu_sleep(ist);
-        ist->pts = ist->next_pts;
+        ist->last_dts = ist->next_dts;
          switch (ist->st->codec->codec_type) {
          case AVMEDIA_TYPE_AUDIO:
-            ist->next_pts += ((int64_t)AV_TIME_BASE * ist->st->codec->frame_size) /
+            ist->next_dts += ((int64_t)AV_TIME_BASE * ist->st->codec->frame_size) /
                               ist->st->codec->sample_rate;
              break;
          case AVMEDIA_TYPE_VIDEO:
              if (ist->st->codec->time_base.num != 0) {
                  int ticks = ist->st->parser ? ist->st->parser->repeat_pict + 1 : ist->st->codec->ticks_per_frame;
-                ist->next_pts += ((int64_t)AV_TIME_BASE *
+                ist->next_dts += ((int64_t)AV_TIME_BASE *
                                    ist->st->codec->time_base.num * ticks) /
                                    ist->st->codec->time_base.den;
              }
@@ -2153,6 +2223,8 @@ static int init_input_stream(int ist_index, OutputStream *output_streams, int nb
              ist->st->codec->opaque         = ist;
          }
  
+        if (!av_dict_get(ist->opts, "threads", NULL, 0))
+            av_dict_set(&ist->opts, "threads", "auto", 0);
          if (avcodec_open2(ist->st->codec, codec, &ist->opts) < 0) {
              snprintf(error, error_len, "Error while opening decoder for input stream #%d:%d",
                      ist->file_index, ist->st->index);
@@ -2162,8 +2234,8 @@ static int init_input_stream(int ist_index, OutputStream *output_streams, int nb
          assert_avoptions(ist->opts);
      }
  
-    ist->pts = ist->st->avg_frame_rate.num ? - ist->st->codec->has_b_frames * AV_TIME_BASE / av_q2d(ist->st->avg_frame_rate) : 0;
-    ist->next_pts = AV_NOPTS_VALUE;
+    ist->last_dts = ist->st->avg_frame_rate.num ? - ist->st->codec->has_b_frames * AV_TIME_BASE / av_q2d(ist->st->avg_frame_rate) : 0;
+    ist->next_dts = AV_NOPTS_VALUE;
      init_pts_correction(&ist->pts_ctx);
      ist->is_start = 1;
  
@@ -2387,6 +2459,7 @@ static int transcode_init(OutputFile *output_files,
  #endif
                  break;
              case AVMEDIA_TYPE_SUBTITLE:
+                codec->time_base = (AVRational){1, 1000};
                  break;
              default:
                  abort();
@@ -2420,18 +2493,6 @@ static int transcode_init(OutputFile *output_files,
                  }
              }
          }
-        if (codec->codec_type == AVMEDIA_TYPE_VIDEO) {
-            int        size = codec->width * codec->height;
-            bit_buffer_size = FFMAX(bit_buffer_size, 6 * size + 200);
-        }
-    }
-
-    if (!bit_buffer)
-        bit_buffer = av_malloc(bit_buffer_size);
-    if (!bit_buffer) {
-        av_log(NULL, AV_LOG_ERROR, "Cannot allocate %d bytes output buffer\n",
-               bit_buffer_size);
-        return AVERROR(ENOMEM);
      }
  
      /* open each encoder */
@@ -2455,6 +2516,8 @@ static int transcode_init(OutputFile *output_files,
                  memcpy(ost->st->codec->subtitle_header, dec->subtitle_header, dec->subtitle_header_size);
                  ost->st->codec->subtitle_header_size = dec->subtitle_header_size;
              }
+            if (!av_dict_get(ost->opts, "threads", NULL, 0))
+                av_dict_set(&ost->opts, "threads", "auto", 0);
              if (avcodec_open2(ost->st->codec, codec, &ost->opts) < 0) {
                  snprintf(error, sizeof(error), "Error while opening encoder for output stream #%d:%d - maybe incorrect parameters such as bit_rate, rate, width or height",
                          ost->file_index, ost->index);
@@ -2609,7 +2672,7 @@ static int transcode(OutputFile *output_files,
                  (os->pb && avio_tell(os->pb) >= of->limit_filesize))
                  continue;
              opts = ost->st->pts.val * av_q2d(ost->st->time_base);
-            ipts = ist->pts;
+            ipts = ist->last_dts;
              if (!input_files[ist->file_index].eof_reached) {
                  if (ipts < ipts_min) {
                      ipts_min = ipts;
@@ -2682,14 +2745,14 @@ static int transcode(OutputFile *output_files,
              pkt.dts *= ist->ts_scale;
  
          //fprintf(stderr, "next:%"PRId64" dts:%"PRId64" off:%"PRId64" %d\n",
-        //        ist->next_pts,
+        //        ist->next_dts,
          //        pkt.dts, input_files[ist->file_index].ts_offset,
          //        ist->st->codec->codec_type);
-        if (pkt.dts != AV_NOPTS_VALUE && ist->next_pts != AV_NOPTS_VALUE
+        if (pkt.dts != AV_NOPTS_VALUE && ist->next_dts != AV_NOPTS_VALUE
              && (is->iformat->flags & AVFMT_TS_DISCONT)) {
              int64_t pkt_dts = av_rescale_q(pkt.dts, ist->st->time_base, AV_TIME_BASE_Q);
-            int64_t delta   = pkt_dts - ist->next_pts;
-            if ((FFABS(delta) > 1LL * dts_delta_threshold * AV_TIME_BASE || pkt_dts + 1 < ist->pts) && !copy_ts) {
+            int64_t delta   = pkt_dts - ist->next_dts;
+            if ((FFABS(delta) > 1LL * dts_delta_threshold * AV_TIME_BASE || pkt_dts + 1 < ist->last_dts) && !copy_ts) {
                  input_files[ist->file_index].ts_offset -= delta;
                  av_log(NULL, AV_LOG_DEBUG,
                         "timestamp discontinuity %"PRId64", new offset= %"PRId64"\n",
@@ -2762,7 +2825,6 @@ static int transcode(OutputFile *output_files,
      ret = 0;
  
   fail:
-    av_freep(&bit_buffer);
      av_freep(&no_packet);
  
      if (output_streams) {
@@ -3072,7 +3134,7 @@ static AVCodec *choose_decoder(OptionsContext *o, AVFormatContext *s, AVStream *
   */
  static void add_input_streams(OptionsContext *o, AVFormatContext *ic)
  {
-    int i, rfps, rfps_base;
+    int i;
  
      for (i = 0; i < ic->nb_streams; i++) {
          AVStream *st = ic->streams[i];
@@ -3097,21 +3159,12 @@ static void add_input_streams(OptionsContext *o, AVFormatContext *ic)
                  st->discard = AVDISCARD_ALL;
              break;
          case AVMEDIA_TYPE_VIDEO:
-            rfps      = ic->streams[i]->r_frame_rate.num;
-            rfps_base = ic->streams[i]->r_frame_rate.den;
              if (dec->lowres) {
                  dec->flags |= CODEC_FLAG_EMU_EDGE;
                  dec->height >>= dec->lowres;
                  dec->width  >>= dec->lowres;
              }
  
-            if (dec->time_base.den != rfps * dec->ticks_per_frame || dec->time_base.num != rfps_base) {
-
-                av_log(NULL, AV_LOG_INFO,"\nSeems stream %d codec frame rate differs from container frame rate: %2.2f (%d/%d) -> %2.2f (%d/%d)\n",
-                       i, (float)dec->time_base.den / dec->time_base.num, dec->time_base.den, dec->time_base.num,
-                       (float)rfps / rfps_base, rfps, rfps_base);
-            }
-
              if (o->video_disable)
                  st->discard = AVDISCARD_ALL;
              else if (video_discard)
@@ -3612,13 +3665,13 @@ static OutputStream *new_video_stream(OptionsContext *o, AVFormatContext *oc)
          ost->top_field_first = -1;
          MATCH_PER_STREAM_OPT(top_field_first, i, ost->top_field_first, oc, st);
  
-        MATCH_PER_STREAM_OPT(copy_initial_nonkeyframes, i, ost->copy_initial_nonkeyframes, oc ,st);
-
  #if CONFIG_AVFILTER
          MATCH_PER_STREAM_OPT(filters, str, filters, oc, st);
          if (filters)
              ost->avfilter = av_strdup(filters);
  #endif
+    } else {
+        MATCH_PER_STREAM_OPT(copy_initial_nonkeyframes, i, ost->copy_initial_nonkeyframes, oc ,st);
      }
  
      return ost;
@@ -4308,6 +4361,24 @@ static int opt_video_filters(OptionsContext *o, const char *opt, const char *arg
      return parse_option(o, "filter:v", arg, options);
  }
  
+static int opt_vsync(const char *opt, const char *arg)
+{
+    if      (!av_strcasecmp(arg, "cfr"))         video_sync_method = VSYNC_CFR;
+    else if (!av_strcasecmp(arg, "vfr"))         video_sync_method = VSYNC_VFR;
+    else if (!av_strcasecmp(arg, "passthrough")) video_sync_method = VSYNC_PASSTHROUGH;
+
+    if (video_sync_method == VSYNC_AUTO)
+        video_sync_method = parse_number_or_die("vsync", arg, OPT_INT, VSYNC_AUTO, VSYNC_VFR);
+    return 0;
+}
+
+static int opt_deinterlace(const char *opt, const char *arg)
+{
+    av_log(NULL, AV_LOG_WARNING, "-%s is deprecated, use -filter:v yadif instead\n", opt);
+    do_deinterlace = 1;
+    return 0;
+}
+
  #define OFFSET(x) offsetof(OptionsContext, x)
  static const OptionDef options[] = {
      /* main options */
@@ -4338,7 +4409,7 @@ static const OptionDef options[] = {
        "when dumping packets, also dump the payload" },
      { "re", OPT_BOOL | OPT_EXPERT | OPT_OFFSET, {.off = OFFSET(rate_emu)}, "read input at native frame rate", "" },
      { "target", HAS_ARG | OPT_FUNC2, {(void*)opt_target}, "specify target file type (\"vcd\", \"svcd\", \"dvd\", \"dv\", \"dv50\", \"pal-vcd\", \"ntsc-svcd\", ...)", "type" },
-    { "vsync", HAS_ARG | OPT_INT | OPT_EXPERT, {(void*)&video_sync_method}, "video sync method", "" },
+    { "vsync", HAS_ARG | OPT_EXPERT, {(void*)opt_vsync}, "video sync method", "" },
      { "async", HAS_ARG | OPT_INT | OPT_EXPERT, {(void*)&audio_sync_method}, "audio sync method", "" },
      { "adrift_threshold", HAS_ARG | OPT_FLOAT | OPT_EXPERT, {(void*)&audio_drift_threshold}, "audio drift threshold", "threshold" },
      { "copyts", OPT_BOOL | OPT_EXPERT, {(void*)&copy_ts}, "copy timestamps" },
@@ -4372,8 +4443,8 @@ static const OptionDef options[] = {
        "use same quantizer as source (implies VBR)" },
      { "pass", HAS_ARG | OPT_VIDEO, {(void*)opt_pass}, "select the pass number (1 or 2)", "n" },
      { "passlogfile", HAS_ARG | OPT_STRING | OPT_VIDEO, {(void*)&pass_logfilename_prefix}, "select two pass log file name prefix", "prefix" },
-    { "deinterlace", OPT_BOOL | OPT_EXPERT | OPT_VIDEO, {(void*)&do_deinterlace},
-      "deinterlace pictures" },
+    { "deinterlace", OPT_EXPERT | OPT_VIDEO, {(void*)opt_deinterlace},
+      "this option is deprecated, use the yadif filter instead" },
      { "vstats", OPT_EXPERT | OPT_VIDEO, {(void*)&opt_vstats}, "dump video coding statistics to file" },
      { "vstats_file", HAS_ARG | OPT_EXPERT | OPT_VIDEO, {(void*)opt_vstats_file}, "dump video coding statistics to file", "file" },
  #if CONFIG_AVFILTER