git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/muxer/frame_muxer.cpp

   1 /*
   2 * Copyright (c) 2011 Sveriges Television AB <info@casparcg.com>
   3 *
   4 * This file is part of CasparCG (www.casparcg.com).
   5 *
   6 * CasparCG is free software: you can redistribute it and/or modify
   7 * it under the terms of the GNU General Public License as published by
   8 * the Free Software Foundation, either version 3 of the License, or
   9 * (at your option) any later version.
  10 *
  11 * CasparCG is distributed in the hope that it will be useful,
  12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14 * GNU General Public License for more details.
  15 *
  16 * You should have received a copy of the GNU General Public License
  17 * along with CasparCG. If not, see <http://www.gnu.org/licenses/>.
  18 *
  19 * Author: Robert Nagy, ronag89@gmail.com
  20 */
  21
  22 #include "../../StdAfx.h"
  23
  24 #include "frame_muxer.h"
  25
  26 #include "../filter/filter.h"
  27 #include "../util/util.h"
  28 #include "../../ffmpeg.h"
  29
  30 #include <core/producer/frame_producer.h>
  31 #include <core/frame/draw_frame.h>
  32 #include <core/frame/frame_transform.h>
  33 #include <core/frame/pixel_format.h>
  34 #include <core/frame/frame_factory.h>
  35 #include <core/frame/frame.h>
  36 #include <core/frame/audio_channel_layout.h>
  37
  38 #include <common/env.h>
  39 #include <common/except.h>
  40 #include <common/log.h>
  41
  42 #if defined(_MSC_VER)
  43 #pragma warning (push)
  44 #pragma warning (disable : 4244)
  45 #endif
  46 extern "C"
  47 {
  48         #define __STDC_CONSTANT_MACROS
  49         #define __STDC_LIMIT_MACROS
  50         #include <libavcodec/avcodec.h>
  51         #include <libavformat/avformat.h>
  52 }
  53 #if defined(_MSC_VER)
  54 #pragma warning (pop)
  55 #endif
  56
  57 #include <common/assert.h>
  58 #include <boost/range/algorithm_ext/push_back.hpp>
  59 #include <boost/algorithm/string/predicate.hpp>
  60
  61 #include <deque>
  62 #include <queue>
  63 #include <vector>
  64
  65 using namespace caspar::core;
  66
  67 namespace caspar { namespace ffmpeg {
  68
  69 bool is_frame_format_changed(const AVFrame& lhs, const AVFrame& rhs)
  70 {
  71         if (lhs.format != rhs.format)
  72                 return true;
  73
  74         for (int i = 0; i < AV_NUM_DATA_POINTERS; ++i)
  75         {
  76                 if (lhs.linesize[i] != rhs.linesize[i])
  77                         return true;
  78         }
  79
  80         return false;
  81 }
  82
  83 struct frame_muxer::impl : boost::noncopyable
  84 {
  85         std::queue<core::mutable_frame>                                 video_stream_;
  86         core::mutable_audio_buffer                                              audio_stream_;
  87         std::queue<draw_frame>                                                  frame_buffer_;
  88         display_mode                                                                    display_mode_                   = display_mode::invalid;
  89         const double                                                                    in_fps_;
  90         const video_format_desc                                                 format_desc_;
  91         audio_channel_layout                                                    channel_layout_;
  92
  93         std::vector<int>                                                                audio_cadence_                  = format_desc_.audio_cadence;
  94
  95         spl::shared_ptr<core::frame_factory>                    frame_factory_;
  96         std::shared_ptr<AVFrame>                                                previous_frame_;
  97
  98         std::unique_ptr<filter>                                                 filter_;
  99         const std::wstring                                                              filter_str_;
 100         bool                                                                                    force_deinterlacing_    = env::properties().get(L"configuration.force-deinterlace", true);
 101
 102         impl(
 103                         double in_fps,
 104                         const spl::shared_ptr<core::frame_factory>& frame_factory,
 105                         const core::video_format_desc& format_desc,
 106                         const core::audio_channel_layout& channel_layout,
 107                         const std::wstring& filter_str)
 108                 : in_fps_(in_fps)
 109                 , format_desc_(format_desc)
 110                 , channel_layout_(channel_layout)
 111                 , frame_factory_(frame_factory)
 112                 , filter_str_(filter_str)
 113         {
 114                 // Note: Uses 1 step rotated cadence for 1001 modes (1602, 1602, 1601, 1602, 1601)
 115                 // This cadence fills the audio mixer most optimally.
 116                 boost::range::rotate(audio_cadence_, std::end(audio_cadence_)-1);
 117         }
 118
 119         void push_video(const std::shared_ptr<AVFrame>& video)
 120         {
 121                 if(!video)
 122                         return;
 123
 124                 if (previous_frame_ && video->data[0] && is_frame_format_changed(*previous_frame_, *video))
 125                 {
 126                         // Fixes bug where avfilter crashes server on some DV files (starts in YUV420p but changes to YUV411p after the first frame).
 127                         if (!ffmpeg::is_logging_disabled_for_thread())
 128                                 CASPAR_LOG(info) << L"[frame_muxer] Frame format has changed. Resetting display mode.";
 129                         display_mode_ = display_mode::invalid;
 130                 }
 131
 132                 if(!video->data[0])
 133                 {
 134                         auto empty_frame = frame_factory_->create_frame(this, core::pixel_format_desc(core::pixel_format::invalid), channel_layout_);
 135                         video_stream_.push(std::move(empty_frame));
 136                         display_mode_ = display_mode::simple;
 137                 }
 138                 else
 139                 {
 140                         if(!filter_ || display_mode_ == display_mode::invalid)
 141                                 update_display_mode(video);
 142
 143                         filter_->push(video);
 144                         previous_frame_ = video;
 145                         for (auto& av_frame : filter_->poll_all())
 146                                 video_stream_.push(make_frame(this, av_frame, format_desc_.fps, *frame_factory_, channel_layout_));
 147                 }
 148
 149                 merge();
 150         }
 151
 152         void push_audio(const std::shared_ptr<AVFrame>& audio)
 153         {
 154                 if(!audio)
 155                         return;
 156
 157                 if(!audio->data[0])
 158                 {
 159                         if (channel_layout_ == core::audio_channel_layout::invalid())
 160                                 channel_layout_ = *core::audio_channel_layout_repository::get_default()->get_layout(L"stereo");
 161
 162                         boost::range::push_back(audio_stream_, core::mutable_audio_buffer(audio_cadence_.front() * channel_layout_.num_channels, 0));
 163                 }
 164                 else
 165                 {
 166                         auto ptr = reinterpret_cast<int32_t*>(audio->data[0]);
 167                         audio_stream_.insert(audio_stream_.end(), ptr, ptr + audio->linesize[0]/sizeof(int32_t));
 168                 }
 169
 170                 merge();
 171         }
 172
 173         bool video_ready() const
 174         {
 175                 switch(display_mode_)
 176                 {
 177                 case display_mode::deinterlace_bob_reinterlace:
 178                 case display_mode::interlace:
 179                 case display_mode::half:
 180                         return video_stream_.size() >= 2;
 181                 default:
 182                         return video_stream_.size() >= 1;
 183                 }
 184         }
 185
 186         bool audio_ready() const
 187         {
 188                 switch(display_mode_)
 189                 {
 190                 case display_mode::duplicate:
 191                         return audio_stream_.size() >= static_cast<size_t>(audio_cadence_[0] + audio_cadence_[1 % audio_cadence_.size()]) * channel_layout_.num_channels;
 192                 default:
 193                         return audio_stream_.size() >= static_cast<size_t>(audio_cadence_.front()) * channel_layout_.num_channels;
 194                 }
 195         }
 196
 197         bool empty() const
 198         {
 199                 return frame_buffer_.empty();
 200         }
 201
 202         core::draw_frame front() const
 203         {
 204                 return frame_buffer_.front();
 205         }
 206
 207         void pop()
 208         {
 209                 frame_buffer_.pop();
 210         }
 211
 212         void merge()
 213         {
 214                 while(video_ready() && audio_ready() && display_mode_ != display_mode::invalid)
 215                 {
 216                         auto frame1                     = pop_video();
 217                         frame1.audio_data()     = pop_audio();
 218
 219                         switch(display_mode_)
 220                         {
 221                         case display_mode::simple:
 222                         case display_mode::deinterlace_bob:
 223                         case display_mode::deinterlace:
 224                                 {
 225                                         frame_buffer_.push(core::draw_frame(std::move(frame1)));
 226                                         break;
 227                                 }
 228                         case display_mode::interlace:
 229                         case display_mode::deinterlace_bob_reinterlace:
 230                                 {
 231                                         auto frame2 = pop_video();
 232
 233                                         frame_buffer_.push(core::draw_frame::interlace(
 234                                                 core::draw_frame(std::move(frame1)),
 235                                                 core::draw_frame(std::move(frame2)),
 236                                                 format_desc_.field_mode));
 237                                         break;
 238                                 }
 239                         case display_mode::duplicate:
 240                                 {
 241                                         //boost::range::push_back(frame1.audio_data(), pop_audio());
 242
 243                                         auto second_audio_frame = core::mutable_frame(
 244                                                         std::vector<array<std::uint8_t>>(),
 245                                                         pop_audio(),
 246                                                         frame1.stream_tag(),
 247                                                         core::pixel_format_desc(),
 248                                                         channel_layout_);
 249                                         auto first_frame = core::draw_frame(std::move(frame1));
 250                                         auto muted_first_frame = core::draw_frame(first_frame);
 251                                         muted_first_frame.transform().audio_transform.volume = 0;
 252                                         auto second_frame = core::draw_frame({ core::draw_frame(std::move(second_audio_frame)), muted_first_frame });
 253
 254                                         // Same video but different audio.
 255                                         frame_buffer_.push(first_frame);
 256                                         frame_buffer_.push(second_frame);
 257                                         break;
 258                                 }
 259                         case display_mode::half:
 260                                 {
 261                                         pop_video(); // Throw away
 262
 263                                         frame_buffer_.push(core::draw_frame(std::move(frame1)));
 264                                         break;
 265                                 }
 266                         default:
 267                                 CASPAR_THROW_EXCEPTION(invalid_operation());
 268                         }
 269                 }
 270         }
 271
 272         core::mutable_frame pop_video()
 273         {
 274                 auto frame = std::move(video_stream_.front());
 275                 video_stream_.pop();
 276                 return std::move(frame);
 277         }
 278
 279         core::mutable_audio_buffer pop_audio()
 280         {
 281                 if (audio_stream_.size() < audio_cadence_.front() * channel_layout_.num_channels)
 282                         CASPAR_THROW_EXCEPTION(out_of_range());
 283
 284                 auto begin = audio_stream_.begin();
 285                 auto end   = begin + audio_cadence_.front() * channel_layout_.num_channels;
 286
 287                 core::mutable_audio_buffer samples(begin, end);
 288                 audio_stream_.erase(begin, end);
 289
 290                 boost::range::rotate(audio_cadence_, std::begin(audio_cadence_)+1);
 291
 292                 return samples;
 293         }
 294
 295         void update_display_mode(const std::shared_ptr<AVFrame>& frame)
 296         {
 297                 std::wstring filter_str = filter_str_;
 298
 299                 display_mode_ = display_mode::simple;
 300
 301                 auto mode = get_mode(*frame);
 302                 if(mode == core::field_mode::progressive && frame->height < 720 && in_fps_ < 50.0) // SD frames are interlaced. Probably incorrect meta-data. Fix it.
 303                         mode = core::field_mode::upper;
 304
 305                 auto fps  = in_fps_;
 306
 307                 if(filter::is_deinterlacing(filter_str_))
 308                         mode = core::field_mode::progressive;
 309
 310                 if(filter::is_double_rate(filter_str_))
 311                         fps *= 2;
 312
 313                 display_mode_ = get_display_mode(mode, fps, format_desc_.field_mode, format_desc_.fps);
 314
 315                 if((frame->height != 480 || format_desc_.height != 486) && // don't deinterlace for NTSC DV
 316                                 display_mode_ == display_mode::simple && mode != core::field_mode::progressive && format_desc_.field_mode != core::field_mode::progressive &&
 317                                 frame->height != format_desc_.height)
 318                 {
 319                         display_mode_ = display_mode::deinterlace_bob_reinterlace; // The frame will most likely be scaled, we need to deinterlace->reinterlace
 320                 }
 321
 322                 // ALWAYS de-interlace, until we have GPU de-interlacing.
 323                 if(force_deinterlacing_ && frame->interlaced_frame && display_mode_ != display_mode::deinterlace_bob && display_mode_ != display_mode::deinterlace)
 324                         display_mode_ = display_mode::deinterlace_bob_reinterlace;
 325
 326                 if(display_mode_ == display_mode::deinterlace)
 327                         filter_str = append_filter(filter_str, L"YADIF=0:-1");
 328                 else if(display_mode_ == display_mode::deinterlace_bob || display_mode_ == display_mode::deinterlace_bob_reinterlace)
 329                         filter_str = append_filter(filter_str, L"YADIF=1:-1");
 330
 331                 if(display_mode_ == display_mode::invalid)
 332                 {
 333                         if (!ffmpeg::is_logging_disabled_for_thread())
 334                                 CASPAR_LOG(warning) << L"[frame_muxer] Auto-transcode: Failed to detect display-mode.";
 335                         display_mode_ = display_mode::simple;
 336                 }
 337
 338                 if(frame->height == 480) // NTSC DV
 339                 {
 340                         auto pad_str = L"PAD=" + boost::lexical_cast<std::wstring>(frame->width) + L":486:0:2:black";
 341                         filter_str = append_filter(filter_str, pad_str);
 342                 }
 343
 344                 filter_.reset (new filter(
 345                         frame->width,
 346                         frame->height,
 347                         boost::rational<int>(1000000, static_cast<int>(in_fps_ * 1000000)),
 348                         boost::rational<int>(static_cast<int>(in_fps_ * 1000000), 1000000),
 349                         boost::rational<int>(frame->sample_aspect_ratio.num, frame->sample_aspect_ratio.den),
 350                         static_cast<AVPixelFormat>(frame->format),
 351                         std::vector<AVPixelFormat>(),
 352                         u8(filter_str)));
 353
 354                 if (!ffmpeg::is_logging_disabled_for_thread())
 355                         CASPAR_LOG(info) << L"[frame_muxer] " << display_mode_ << L" " << print_mode(frame->width, frame->height, in_fps_, frame->interlaced_frame > 0);
 356         }
 357
 358         uint32_t calc_nb_frames(uint32_t nb_frames) const
 359         {
 360                 uint64_t nb_frames2 = nb_frames;
 361
 362                 if(filter_ && filter_->is_double_rate()) // Take into account transformations in filter.
 363                         nb_frames2 *= 2;
 364
 365                 switch(display_mode_) // Take into account transformation in run.
 366                 {
 367                 case display_mode::deinterlace_bob_reinterlace:
 368                 case display_mode::interlace:
 369                 case display_mode::half:
 370                         nb_frames2 /= 2;
 371                         break;
 372                 case display_mode::duplicate:
 373                         nb_frames2 *= 2;
 374                         break;
 375                 }
 376
 377                 return static_cast<uint32_t>(nb_frames2);
 378         }
 379
 380         void clear()
 381         {
 382                 while(!video_stream_.empty())
 383                         video_stream_.pop();
 384
 385                 audio_stream_.clear();
 386
 387                 while(!frame_buffer_.empty())
 388                         frame_buffer_.pop();
 389
 390                 filter_.reset();
 391         }
 392 };
 393
 394 frame_muxer::frame_muxer(
 395                 double in_fps,
 396                 const spl::shared_ptr<core::frame_factory>& frame_factory,
 397                 const core::video_format_desc& format_desc,
 398                 const core::audio_channel_layout& channel_layout,
 399                 const std::wstring& filter)
 400         : impl_(new impl(in_fps, frame_factory, format_desc, channel_layout, filter)){}
 401 void frame_muxer::push_video(const std::shared_ptr<AVFrame>& frame){impl_->push_video(frame);}
 402 void frame_muxer::push_audio(const std::shared_ptr<AVFrame>& frame){impl_->push_audio(frame);}
 403 bool frame_muxer::empty() const{return impl_->empty();}
 404 core::draw_frame frame_muxer::front() const{return impl_->front();}
 405 void frame_muxer::pop(){return impl_->pop();}
 406 void frame_muxer::clear(){impl_->clear();}
 407 uint32_t frame_muxer::calc_nb_frames(uint32_t nb_frames) const {return impl_->calc_nb_frames(nb_frames);}
 408 bool frame_muxer::video_ready() const{return impl_->video_ready();}
 409 bool frame_muxer::audio_ready() const{return impl_->audio_ready();}
 410
 411 }}