ffmpeg: fix codecids with ffserver + ffmpeg + ffm
diff --git a/ffmpeg.c b/ffmpeg.c
index fb30c8e0c0b9253f0946c3730cf122ec291cceb4..9154f3cb4adb26176ef654898f90220821ccd094 100644
--- a/ffmpeg.c
+++ b/ffmpeg.c
@@ -168,7 +168,6 @@ static uint8_t *audio_buf;
 static uint8_t *audio_out;
 static unsigned int allocated_audio_out_size, allocated_audio_buf_size;
 
-static void *samples;
 static uint8_t *input_tmp= NULL;
 
 #define DEFAULT_PASS_LOGFILENAME_PREFIX "ffmpeg2pass"
@@ -179,6 +178,8 @@ typedef struct InputStream {
     int discard;             /* true if stream data should be discarded */
     int decoding_needed;     /* true if the packets must be decoded in 'raw_fifo' */
     AVCodec *dec;
+    AVFrame *decoded_frame;
+    AVFrame *filtered_frame;
 
     int64_t       start;     /* time when read started */
     int64_t       next_pts;  /* synthetic pts for cases where pkt.pts
@@ -658,8 +659,11 @@ void av_noreturn exit_program(int ret)
     for(i=0;i<nb_input_files;i++) {
         av_close_input_file(input_files[i].ctx);
     }
-    for (i = 0; i < nb_input_streams; i++)
+    for (i = 0; i < nb_input_streams; i++) {
+        av_freep(&input_streams[i].decoded_frame);
+        av_freep(&input_streams[i].filtered_frame);
         av_dict_free(&input_streams[i].opts);
+    }
 
     if (vstats_file)
         fclose(vstats_file);
@@ -674,7 +678,6 @@ void av_noreturn exit_program(int ret)
     av_free(audio_buf);
     av_free(audio_out);
     allocated_audio_buf_size= allocated_audio_out_size= 0;
-    av_free(samples);
 
 #if CONFIG_AVFILTER
     avfilter_uninit();
@@ -764,6 +767,8 @@ static void choose_pixel_fmt(AVStream *st, AVCodec *codec)
 {
     if(codec && codec->pix_fmts){
         const enum PixelFormat *p= codec->pix_fmts;
+        int has_alpha= av_pix_fmt_descriptors[st->codec->pix_fmt].nb_components % 2 == 0;
+        enum PixelFormat best= PIX_FMT_NONE;
         if(st->codec->strict_std_compliance <= FF_COMPLIANCE_UNOFFICIAL){
             if(st->codec->codec_id==CODEC_ID_MJPEG){
                 p= (const enum PixelFormat[]){PIX_FMT_YUVJ420P, PIX_FMT_YUVJ422P, PIX_FMT_YUV420P, PIX_FMT_YUV422P, PIX_FMT_NONE};
@@ -772,6 +777,7 @@ static void choose_pixel_fmt(AVStream *st, AVCodec *codec)
             }
         }
         for (; *p != PIX_FMT_NONE; p++) {
+            best= avcodec_find_best_pix_fmt2(best, *p, st->codec->pix_fmt, has_alpha, NULL);
             if(*p == st->codec->pix_fmt)
                 break;
         }
@@ -781,8 +787,8 @@ static void choose_pixel_fmt(AVStream *st, AVCodec *codec)
                         "Incompatible pixel format '%s' for codec '%s', auto-selecting format '%s'\n",
                         av_pix_fmt_descriptors[st->codec->pix_fmt].name,
                         codec->name,
-                        av_pix_fmt_descriptors[codec->pix_fmts[0]].name);
-            st->codec->pix_fmt = codec->pix_fmts[0];
+                        av_pix_fmt_descriptors[best].name);
+            st->codec->pix_fmt = best;
         }
     }
 }
@@ -835,14 +841,11 @@ static void generate_silence(uint8_t* buf, enum AVSampleFormat sample_fmt, size_
     memset(buf, fill_char, size);
 }
 
-static void do_audio_out(AVFormatContext *s,
-                         OutputStream *ost,
-                         InputStream *ist,
-                         unsigned char *buf, int size)
+static void do_audio_out(AVFormatContext *s, OutputStream *ost,
+                         InputStream *ist, AVFrame *decoded_frame)
 {
     uint8_t *buftmp;
     int64_t audio_out_size, audio_buf_size;
-    int64_t allocated_for_size= size;
 
     int size_out, frame_bytes, ret, resample_changed;
     AVCodecContext *enc= ost->st->codec;
@@ -850,6 +853,9 @@ static void do_audio_out(AVFormatContext *s,
     int osize = av_get_bytes_per_sample(enc->sample_fmt);
     int isize = av_get_bytes_per_sample(dec->sample_fmt);
     const int coded_bps = av_get_bits_per_sample(enc->codec->id);
+    uint8_t *buf = decoded_frame->data[0];
+    int size     = decoded_frame->nb_samples * dec->channels * isize;
+    int64_t allocated_for_size = size;
 
 need_realloc:
     audio_buf_size= (allocated_for_size + isize*dec->channels - 1) / (isize*dec->channels);
@@ -876,7 +882,9 @@ need_realloc:
     }
 
     if (enc->channels != dec->channels
-     || enc->sample_fmt != dec->sample_fmt)
+     || enc->sample_fmt != dec->sample_fmt
+     || enc->sample_rate!= dec->sample_rate
+    )
         ost->audio_resample = 1;
 
     resample_changed = ost->resample_sample_fmt  != dec->sample_fmt ||
@@ -1293,7 +1301,8 @@ static void do_video_out(AVFormatContext *s,
         av_init_packet(&pkt);
         pkt.stream_index= ost->index;
 
-        if (s->oformat->flags & AVFMT_RAWPICTURE) {
+        if (s->oformat->flags & AVFMT_RAWPICTURE &&
+            enc->codec->id == CODEC_ID_RAWVIDEO) {
             /* raw pictures are written as AVPicture structure to
                avoid any copies. We support temporarily the older
                method. */
@@ -1558,7 +1567,7 @@ static void flush_encoders(OutputStream *ost_table, int nb_ostreams)
 
         if (ost->st->codec->codec_type == AVMEDIA_TYPE_AUDIO && enc->frame_size <=1)
             continue;
-        if (ost->st->codec->codec_type == AVMEDIA_TYPE_VIDEO && (os->oformat->flags & AVFMT_RAWPICTURE))
+        if (ost->st->codec->codec_type == AVMEDIA_TYPE_VIDEO && (os->oformat->flags & AVFMT_RAWPICTURE) && enc->codec->id == CODEC_ID_RAWVIDEO)
             continue;
 
         for(;;) {
@@ -1726,39 +1735,42 @@ static void rate_emu_sleep(InputStream *ist)
 
 static int transcode_audio(InputStream *ist, AVPacket *pkt, int *got_output)
 {
-    static unsigned int samples_size = 0;
+    AVFrame *decoded_frame;
+    AVCodecContext *avctx = ist->st->codec;
     int bps = av_get_bytes_per_sample(ist->st->codec->sample_fmt);
-    uint8_t *decoded_data_buf  = NULL;
-    int      decoded_data_size = 0;
     int i, ret;
 
-    if (pkt && samples_size < FFMAX(pkt->size * bps, AVCODEC_MAX_AUDIO_FRAME_SIZE)) {
-        av_free(samples);
-        samples_size = FFMAX(pkt->size * bps, AVCODEC_MAX_AUDIO_FRAME_SIZE);
-        samples      = av_malloc(samples_size);
-    }
-    decoded_data_size = samples_size;
+    if (!ist->decoded_frame && !(ist->decoded_frame = avcodec_alloc_frame()))
+        return AVERROR(ENOMEM);
+    else
+        avcodec_get_frame_defaults(ist->decoded_frame);
+    decoded_frame = ist->decoded_frame;
 
-    ret = avcodec_decode_audio3(ist->st->codec, samples, &decoded_data_size,
-                                pkt);
-    if (ret < 0)
+    ret = avcodec_decode_audio4(avctx, decoded_frame, got_output, pkt);
+    if (ret < 0) {
         return ret;
-    *got_output  = decoded_data_size > 0;
+    }
 
-    /* Some bug in mpeg audio decoder gives */
-    /* decoded_data_size < 0, it seems they are overflows */
     if (!*got_output) {
         /* no audio frame */
         return ret;
     }
 
-    decoded_data_buf = (uint8_t *)samples;
-    ist->next_pts   += ((int64_t)AV_TIME_BASE/bps * decoded_data_size) /
-                       (ist->st->codec->sample_rate * ist->st->codec->channels);
+    /* if the decoder provides a pts, use it instead of the last packet pts.
+       the decoder could be delaying output by a packet or more. */
+    if (decoded_frame->pts != AV_NOPTS_VALUE)
+        ist->next_pts = decoded_frame->pts;
+
+    /* increment next_pts to use for the case where the input stream does not
+       have timestamps or there are multiple frames in the packet */
+    ist->next_pts += ((int64_t)AV_TIME_BASE * decoded_frame->nb_samples) /
+                     avctx->sample_rate;
 
     // preprocess audio (volume)
     if (audio_volume != 256) {
-        switch (ist->st->codec->sample_fmt) {
+        int decoded_data_size = decoded_frame->nb_samples * avctx->channels * bps;
+        void *samples = decoded_frame->data[0];
+        switch (avctx->sample_fmt) {
         case AV_SAMPLE_FMT_U8:
         {
             uint8_t *volp = samples;
@@ -1819,9 +1831,9 @@ static int transcode_audio(InputStream *ist, AVPacket *pkt, int *got_output)
 
         if (!check_output_constraints(ist, ost) || !ost->encoding_needed)
             continue;
-        do_audio_out(output_files[ost->file_index].ctx, ost, ist,
-                     decoded_data_buf, decoded_data_size);
+        do_audio_out(output_files[ost->file_index].ctx, ost, ist, decoded_frame);
     }
+
     return ret;
 }
 
@@ -1834,57 +1846,60 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
 #if CONFIG_AVFILTER
     int frame_available = 1;
 #endif
+    int duration=0;
+    int64_t *best_effort_timestamp;
+    AVRational *frame_sample_aspect;
 
-    if (!(decoded_frame = avcodec_alloc_frame()))
+    if (!ist->decoded_frame && !(ist->decoded_frame = avcodec_alloc_frame()))
         return AVERROR(ENOMEM);
+    else
+        avcodec_get_frame_defaults(ist->decoded_frame);
+    decoded_frame = ist->decoded_frame;
     pkt->pts  = *pkt_pts;
     pkt->dts  = *pkt_dts;
     *pkt_pts  = AV_NOPTS_VALUE;
 
-    if (*pkt_dts != AV_NOPTS_VALUE && pkt->duration) {
-         *pkt_dts += av_rescale_q(pkt->duration, ist->st->time_base, AV_TIME_BASE_Q);
-    } else if(*pkt_dts != AV_NOPTS_VALUE && ist->st->codec->time_base.num != 0) {
+    if (pkt->duration) {
+        duration = av_rescale_q(pkt->duration, ist->st->time_base, AV_TIME_BASE_Q);
+    } else if(ist->st->codec->time_base.num != 0) {
         int ticks= ist->st->parser ? ist->st->parser->repeat_pict+1 : ist->st->codec->ticks_per_frame;
-        *pkt_dts += ((int64_t)AV_TIME_BASE *
+        duration = ((int64_t)AV_TIME_BASE *
                           ist->st->codec->time_base.num * ticks) /
-            ist->st->codec->time_base.den;
+                          ist->st->codec->time_base.den;
+    }
+
+    if(*pkt_dts != AV_NOPTS_VALUE && duration) {
+        *pkt_dts += duration;
     }else
         *pkt_dts = AV_NOPTS_VALUE;
 
     ret = avcodec_decode_video2(ist->st->codec,
                                 decoded_frame, got_output, pkt);
     if (ret < 0)
-        goto fail;
+        return ret;
 
     quality = same_quant ? decoded_frame->quality : 0;
     if (!*got_output) {
         /* no picture yet */
-        av_freep(&decoded_frame);
         return ret;
     }
 
-    if(decoded_frame->best_effort_timestamp != AV_NOPTS_VALUE)
-        ist->next_pts = ist->pts = decoded_frame->best_effort_timestamp;
+    best_effort_timestamp= av_opt_ptr(avcodec_get_frame_class(), decoded_frame, "best_effort_timestamp");
+    if(*best_effort_timestamp != AV_NOPTS_VALUE)
+        ist->next_pts = ist->pts = *best_effort_timestamp;
 
-    if (pkt->duration)
-        ist->next_pts += av_rescale_q(pkt->duration, ist->st->time_base, AV_TIME_BASE_Q);
-    else if (ist->st->codec->time_base.num != 0) {
-        int ticks      = ist->st->parser ? ist->st->parser->repeat_pict + 1 :
-                                           ist->st->codec->ticks_per_frame;
-        ist->next_pts += ((int64_t)AV_TIME_BASE *
-                          ist->st->codec->time_base.num * ticks) /
-                          ist->st->codec->time_base.den;
-    }
+    ist->next_pts += duration;
     pkt->size = 0;
 
     pre_process_video_frame(ist, (AVPicture *)decoded_frame, &buffer_to_free);
 
 #if CONFIG_AVFILTER
+    frame_sample_aspect= av_opt_ptr(avcodec_get_frame_class(), decoded_frame, "sample_aspect_ratio");
     for(i=0;i<nb_output_streams;i++) {
         OutputStream *ost = ost = &output_streams[i];
         if(check_output_constraints(ist, ost)){
-            if (!decoded_frame->sample_aspect_ratio.num)
-                decoded_frame->sample_aspect_ratio = ist->st->sample_aspect_ratio;
+            if (!frame_sample_aspect->num)
+                *frame_sample_aspect = ist->st->sample_aspect_ratio;
             decoded_frame->pts = ist->pts;
 
             av_vsrc_buffer_add_frame(ost->input_video_filter, decoded_frame, AV_VSRC_BUF_FLAG_OVERWRITE);
@@ -1903,17 +1918,21 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
 
 #if CONFIG_AVFILTER
         if (ost->input_video_filter) {
-            frame_available = avfilter_poll_frame(ost->output_video_filter->inputs[0]);
+            frame_available = av_buffersink_poll_frame(ost->output_video_filter);
         }
         while (frame_available) {
             if (ost->output_video_filter) {
                 AVRational ist_pts_tb = ost->output_video_filter->inputs[0]->time_base;
-                if (av_buffersink_get_buffer_ref(ost->output_video_filter, &ost->picref, 0) < 0)
+                if (av_buffersink_get_buffer_ref(ost->output_video_filter, &ost->picref, 0) < 0){
+                    av_log(0, AV_LOG_WARNING, "AV Filter told us it has a frame available but failed to output one\n");
                     goto cont;
-                if (!filtered_frame && !(filtered_frame = avcodec_alloc_frame())) {
-                    ret = AVERROR(ENOMEM);
-                    goto fail;
                 }
+                if (!ist->filtered_frame && !(ist->filtered_frame = avcodec_alloc_frame())) {
+                    av_free(buffer_to_free);
+                    return AVERROR(ENOMEM);
+                } else
+                    avcodec_get_frame_defaults(ist->filtered_frame);
+                filtered_frame = ist->filtered_frame;
                 *filtered_frame= *decoded_frame; //for me_threshold
                 if (ost->picref) {
                     avfilter_fill_frame_from_video_buffer_ref(filtered_frame, ost->picref);
@@ -1932,16 +1951,13 @@ static int transcode_video(InputStream *ist, AVPacket *pkt, int *got_output, int
                 do_video_stats(output_files[ost->file_index].ctx, ost, frame_size);
 #if CONFIG_AVFILTER
             cont:
-            frame_available = ost->output_video_filter && avfilter_poll_frame(ost->output_video_filter->inputs[0]);
+            frame_available = ost->output_video_filter && av_buffersink_poll_frame(ost->output_video_filter);
             avfilter_unref_buffer(ost->picref);
         }
-        av_freep(&filtered_frame);
 #endif
     }
 
-fail:
     av_free(buffer_to_free);
-    av_freep(&decoded_frame);
     return ret;
 }
 
@@ -2053,8 +2069,10 @@ static int output_packet(InputStream *ist,
                              ist->st->codec->sample_rate;
             break;
         case AVMEDIA_TYPE_VIDEO:
-            if (ist->st->codec->time_base.num != 0) {
-                int ticks = ist->st->parser ? ist->st->parser->repeat_pict+1 : ist->st->codec->ticks_per_frame;
+            if (pkt->duration) {
+                ist->next_pts += av_rescale_q(pkt->duration, ist->st->time_base, AV_TIME_BASE_Q);
+            } else if(ist->st->codec->time_base.num != 0) {
+                int ticks= ist->st->parser ? ist->st->parser->repeat_pict+1 : ist->st->codec->ticks_per_frame;
                 ist->next_pts += ((int64_t)AV_TIME_BASE *
                                   ist->st->codec->time_base.num * ticks) /
                                   ist->st->codec->time_base.den;
@@ -2200,7 +2218,10 @@ static int transcode_init(OutputFile *output_files, int nb_output_files,
                     codec->time_base.num *= icodec->ticks_per_frame;
                     codec->time_base.den *= 2;
                 }
-            } else if(!(oc->oformat->flags & AVFMT_VARIABLE_FPS)) {
+            } else if(!(oc->oformat->flags & AVFMT_VARIABLE_FPS)
+                      && strcmp(oc->oformat->name, "mov") && strcmp(oc->oformat->name, "mp4") && strcmp(oc->oformat->name, "3gp")
+                      && strcmp(oc->oformat->name, "3g2") && strcmp(oc->oformat->name, "psp") && strcmp(oc->oformat->name, "ipod")
+            ) {
                 if(   copy_tb<0 && av_q2d(icodec->time_base)*icodec->ticks_per_frame > av_q2d(ist->st->time_base)
                                 && av_q2d(ist->st->time_base) < 1.0/500
                    || copy_tb==0){
@@ -3244,6 +3265,8 @@ static void add_input_streams(OptionsContext *o, AVFormatContext *ic)
                 st->discard= video_discard;
             break;
         case AVMEDIA_TYPE_DATA:
+            if (o->data_disable)
+                st->discard= AVDISCARD_ALL;
             break;
         case AVMEDIA_TYPE_SUBTITLE:
             if(!ist->dec)
@@ -3372,11 +3395,14 @@ static int opt_input_file(OptionsContext *o, const char *opt, const char *filena
     ic->interrupt_callback = int_cb;
 
     if (loop_input) {
-        av_log(NULL, AV_LOG_WARNING, "-loop_input is deprecated, use -loop 1\n");
+        av_log(NULL, AV_LOG_WARNING,
+            "-loop_input is deprecated, use -loop 1\n"
+            "Note, both loop options only work with -f image2\n"
+        );
         ic->loop_input = loop_input;
     }
 
-    /* open the input file with generic libav function */
+    /* open the input file with generic avformat function */
     err = avformat_open_input(&ic, filename, file_iformat, &format_opts);
     if (err < 0) {
         print_error(filename, err);
@@ -3936,6 +3962,7 @@ static int read_ffserver_streams(OptionsContext *o, AVFormatContext *s, const ch
         ost   = new_output_stream(o, s, codec->type);
         st    = ost->st;
         avctx = st->codec;
+        ost->enc = codec;
 
         // FIXME: a more elegant solution is needed
         memcpy(st, ic->streams[i], sizeof(AVStream));
@@ -4061,6 +4088,8 @@ static void opt_output_file(void *optctx, const char *filename)
                 continue;
             if(o->   video_disable && ist->st->codec->codec_type == AVMEDIA_TYPE_VIDEO)
                 continue;
+            if(o->    data_disable && ist->st->codec->codec_type == AVMEDIA_TYPE_DATA)
+                continue;
 
             switch (ist->st->codec->codec_type) {
             case AVMEDIA_TYPE_VIDEO:    ost = new_video_stream(o, oc);    break;
@@ -4134,7 +4163,7 @@ static void opt_output_file(void *optctx, const char *filename)
     }
 
     if (!(oc->oformat->flags & AVFMT_NOFILE)) {
-        /* test if it already exists to avoid loosing precious files */
+        /* test if it already exists to avoid losing precious files */
         assert_file_overwrite(filename);
 
         /* open the file */
@@ -4668,7 +4697,7 @@ static const OptionDef options[] = {
     { "async", HAS_ARG | OPT_INT | OPT_EXPERT, {(void*)&audio_sync_method}, "audio sync method", "" },
     { "adrift_threshold", HAS_ARG | OPT_FLOAT | OPT_EXPERT, {(void*)&audio_drift_threshold}, "audio drift threshold", "threshold" },
     { "copyts", OPT_BOOL | OPT_EXPERT, {(void*)&copy_ts}, "copy timestamps" },
-    { "copytb", HAS_ARG | OPT_INT | OPT_EXPERT, {(void*)&copy_tb}, "copy input stream time base when stream copying" },
+    { "copytb", HAS_ARG | OPT_INT | OPT_EXPERT, {(void*)&copy_tb}, "copy input stream time base when stream copying", "source" },
     { "shortest", OPT_BOOL | OPT_EXPERT, {(void*)&opt_shortest}, "finish encoding within shortest input" }, //
     { "dts_delta_threshold", HAS_ARG | OPT_FLOAT | OPT_EXPERT, {(void*)&dts_delta_threshold}, "timestamp discontinuity delta threshold", "threshold" },
     { "xerror", OPT_BOOL, {(void*)&exit_on_error}, "exit on error", "error" },
@@ -4765,6 +4794,7 @@ static const OptionDef options[] = {
     { "fpre", HAS_ARG | OPT_EXPERT| OPT_FUNC2, {(void*)opt_preset}, "set options from indicated preset file", "filename" },
     /* data codec support */
     { "dcodec", HAS_ARG | OPT_DATA | OPT_FUNC2, {(void*)opt_data_codec}, "force data codec ('copy' to copy stream)", "codec" },
+    { "dn", OPT_BOOL | OPT_VIDEO | OPT_OFFSET, {.off = OFFSET(data_disable)}, "disable data" },
 
     { "default", HAS_ARG | OPT_AUDIO | OPT_VIDEO | OPT_EXPERT, {(void*)opt_default}, "generic catch all option", "" },
     { NULL, },