git.sesse.net Git - casparcg/blobdiff - modules/ffmpeg/producer/frame_muxer.cpp
2.0. audio: Audio pipeline is now in 32 bit.
[casparcg] / modules / ffmpeg / producer / frame_muxer.cpp
index 860df1c1ba91a49a334390f23cf38cc88281765d..affb1c329c6469e4270228f6e73075b0a004ded5 100644 (file)
@@ -8,7 +8,7 @@
 \r
 #include <core/producer/frame_producer.h>\r
 #include <core/producer/frame/basic_frame.h>\r
-#include <core/producer/frame/image_transform.h>\r
+#include <core/producer/frame/frame_transform.h>\r
 #include <core/producer/frame/pixel_format.h>\r
 #include <core/producer/frame/frame_factory.h>\r
 #include <core/mixer/write_frame.h>\r
@@ -82,35 +82,49 @@ struct display_mode
        }\r
 };\r
 \r
-display_mode::type get_display_mode(const core::video_mode::type in_mode, double in_fps, const core::video_mode::type out_mode, double out_fps)\r
+display_mode::type get_display_mode(const core::field_mode::type in_mode, double in_fps, const core::field_mode::type out_mode, double out_fps)\r
 {              \r
        static const auto epsilon = 2.0;\r
 \r
+       if(in_fps < 20.0 || in_fps > 80.0)\r
+       {\r
+               //if(out_mode != core::field_mode::progressive && in_mode == core::field_mode::progressive)\r
+               //      return display_mode::interlace;\r
+               \r
+               if(out_mode == core::field_mode::progressive && in_mode != core::field_mode::progressive)\r
+               {\r
+                       if(in_fps < 35.0)\r
+                               return display_mode::deinterlace;\r
+                       else\r
+                               return display_mode::deinterlace_bob;\r
+               }\r
+       }\r
+\r
        if(std::abs(in_fps - out_fps) < epsilon)\r
        {\r
-               if(in_mode != core::video_mode::progressive && out_mode == core::video_mode::progressive)\r
+               if(in_mode != core::field_mode::progressive && out_mode == core::field_mode::progressive)\r
                        return display_mode::deinterlace;\r
-               //else if(in_mode == core::video_mode::progressive && out_mode != core::video_mode::progressive)\r
+               //else if(in_mode == core::field_mode::progressive && out_mode != core::field_mode::progressive)\r
                //      simple(); // interlace_duplicate();\r
                else\r
                        return display_mode::simple;\r
        }\r
        else if(std::abs(in_fps/2.0 - out_fps) < epsilon)\r
        {\r
-               if(in_mode != core::video_mode::progressive)\r
+               if(in_mode != core::field_mode::progressive)\r
                        return display_mode::invalid;\r
 \r
-               if(out_mode != core::video_mode::progressive)\r
+               if(out_mode != core::field_mode::progressive)\r
                        return display_mode::interlace;\r
                else\r
                        return display_mode::half;\r
        }\r
        else if(std::abs(in_fps - out_fps/2.0) < epsilon)\r
        {\r
-               if(out_mode != core::video_mode::progressive)\r
+               if(out_mode != core::field_mode::progressive)\r
                        return display_mode::invalid;\r
 \r
-               if(in_mode != core::video_mode::progressive)\r
+               if(in_mode != core::field_mode::progressive)\r
                        return display_mode::deinterlace_bob;\r
                else\r
                        return display_mode::duplicate;\r
@@ -122,12 +136,12 @@ display_mode::type get_display_mode(const core::video_mode::type in_mode, double
 struct frame_muxer::implementation : boost::noncopyable\r
 {      \r
        std::deque<std::queue<safe_ptr<write_frame>>>   video_streams_;\r
-       std::deque<std::vector<int16_t>>                                audio_streams_;\r
+       std::deque<std::vector<int32_t>>                                audio_streams_;\r
        std::deque<safe_ptr<basic_frame>>                               frame_buffer_;\r
        display_mode::type                                                              display_mode_;\r
        const double                                                                    in_fps_;\r
        const video_format_desc                                                 format_desc_;\r
-       bool                                                                                    auto_mode_;\r
+       bool                                                                                    auto_transcode_;\r
 \r
        size_t                                                                                  audio_sample_count_;\r
        size_t                                                                                  video_frame_count_;\r
@@ -144,7 +158,7 @@ struct frame_muxer::implementation : boost::noncopyable
                , display_mode_(display_mode::invalid)\r
                , in_fps_(in_fps)\r
                , format_desc_(frame_factory->get_video_format_desc())\r
-               , auto_mode_(env::properties().get("configuration.auto-mode", false))\r
+               , auto_transcode_(env::properties().get("configuration.producers.auto-transcode", false))\r
                , audio_sample_count_(0)\r
                , video_frame_count_(0)\r
                , frame_factory_(frame_factory)\r
@@ -171,12 +185,12 @@ struct frame_muxer::implementation : boost::noncopyable
 \r
                if(display_mode_ == display_mode::invalid)\r
                {\r
-                       if(auto_mode_)\r
+                       if(auto_transcode_)\r
                        {\r
                                auto in_mode = get_mode(*video_frame);\r
-                               display_mode_ = get_display_mode(in_mode, in_fps_, format_desc_.mode, format_desc_.fps);\r
+                               display_mode_ = get_display_mode(in_mode, in_fps_, format_desc_.field_mode, format_desc_.fps);\r
                        \r
-                               if(display_mode_ == display_mode::simple && in_mode != core::video_mode::progressive && format_desc_.mode != core::video_mode::progressive && video_frame->height != static_cast<int>(format_desc_.height))\r
+                               if(display_mode_ == display_mode::simple && in_mode != core::field_mode::progressive && format_desc_.field_mode != core::field_mode::progressive && video_frame->height != static_cast<int>(format_desc_.height))\r
                                        display_mode_ = display_mode::deinterlace_bob_reinterlace; // The frame will most likely be scaled, we need to deinterlace->reinterlace \r
                                \r
                                if(display_mode_ == display_mode::deinterlace)\r
@@ -195,31 +209,41 @@ struct frame_muxer::implementation : boost::noncopyable
 \r
                        CASPAR_LOG(info) << "[frame_muxer] " << display_mode::print(display_mode_);\r
                }\r
+\r
                                \r
                if(hints & core::frame_producer::ALPHA_HINT)\r
-                       try_make_gray(make_safe(video_frame));\r
+                       video_frame->format = make_alpha_format(video_frame->format);\r
+               \r
+               auto format = video_frame->format;\r
+               if(video_frame->format == CASPAR_PIX_FMT_LUMA) // CASPAR_PIX_FMT_LUMA is not valid for filter, change it to GRAY8\r
+                       video_frame->format = PIX_FMT_GRAY8;\r
 \r
                BOOST_FOREACH(auto& av_frame, filter_.execute(video_frame))\r
                {\r
+                       av_frame->format = format;\r
+\r
                        auto frame = make_write_frame(this, av_frame, frame_factory_, hints);\r
 \r
                        // Fix field-order if needed\r
-                       if(frame->get_type() == core::video_mode::lower && format_desc_.mode == core::video_mode::upper)\r
-                               frame->get_image_transform().set_fill_translation(0.0f, 0.5/static_cast<double>(frame->get_pixel_format_desc().planes[0].height));\r
-                       else if(frame->get_type() == core::video_mode::upper && format_desc_.mode == core::video_mode::lower)\r
-                               frame->get_image_transform().set_fill_translation(0.0f, -0.5/static_cast<double>(frame->get_pixel_format_desc().planes[0].height));\r
+                       if(frame->get_type() == core::field_mode::lower && format_desc_.field_mode == core::field_mode::upper)\r
+                               frame->get_frame_transform().fill_translation[1] += 1.0/static_cast<double>(format_desc_.height);\r
+                       else if(frame->get_type() == core::field_mode::upper && format_desc_.field_mode == core::field_mode::lower)\r
+                               frame->get_frame_transform().fill_translation[1] -= 1.0/static_cast<double>(format_desc_.height);\r
 \r
                        video_streams_.back().push(frame);\r
                        ++video_frame_count_;\r
                }\r
+\r
+               if(video_streams_.back().size() > 8)\r
+                       BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("video-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
        }\r
 \r
-       void push(const std::shared_ptr<std::vector<int16_t>>& audio_samples)\r
+       void push(const std::shared_ptr<std::vector<int32_t>>& audio_samples)\r
        {\r
                if(!audio_samples)      \r
                {\r
                        CASPAR_LOG(debug) << L"audio-chunk-count: " << audio_sample_count_/format_desc_.audio_samples_per_frame;\r
-                       audio_streams_.push_back(std::vector<int16_t>());\r
+                       audio_streams_.push_back(std::vector<int32_t>());\r
                        audio_sample_count_ = 0;\r
                        return;\r
                }\r
@@ -227,6 +251,9 @@ struct frame_muxer::implementation : boost::noncopyable
                audio_sample_count_ += audio_samples->size();\r
 \r
                boost::range::push_back(audio_streams_.back(), *audio_samples);\r
+\r
+               if(audio_streams_.back().size() > 8*format_desc_.audio_samples_per_frame)\r
+                       BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("audio-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
        }\r
 \r
        safe_ptr<basic_frame> pop()\r
@@ -249,43 +276,55 @@ struct frame_muxer::implementation : boost::noncopyable
                return frame;\r
        }\r
 \r
-       std::vector<int16_t> pop_audio()\r
+       std::vector<int32_t> pop_audio()\r
        {\r
                CASPAR_VERIFY(audio_streams_.front().size() >= format_desc_.audio_samples_per_frame);\r
 \r
                auto begin = audio_streams_.front().begin();\r
                auto end   = begin + format_desc_.audio_samples_per_frame;\r
 \r
-               auto samples = std::vector<int16_t>(begin, end);\r
+               auto samples = std::vector<int32_t>(begin, end);\r
                audio_streams_.front().erase(begin, end);\r
 \r
                return samples;\r
        }\r
-\r
+       \r
        bool video_ready() const\r
-       {\r
-               return video_frames() > 1 && video_streams_.size() >= audio_streams_.size();\r
+       {               \r
+               return video_streams_.size() > 1 || (video_streams_.size() >= audio_streams_.size() && video_ready2());\r
        }\r
        \r
        bool audio_ready() const\r
        {\r
-               return audio_chunks() > 1 && audio_streams_.size() >= video_streams_.size();\r
+               return audio_streams_.size() > 1 || (audio_streams_.size() >= video_streams_.size() && audio_ready2());\r
        }\r
 \r
-       size_t video_frames() const\r
-       {\r
-               return video_streams_.back().size();\r
+       bool video_ready2() const\r
+       {               \r
+               switch(display_mode_)\r
+               {\r
+               case display_mode::deinterlace_bob_reinterlace:                                 \r
+               case display_mode::interlace:                                   \r
+                       return video_streams_.front().size() >= 2;\r
+               default:                                                                                \r
+                       return !video_streams_.front().empty();\r
+               }\r
        }\r
-\r
-       size_t audio_chunks() const\r
+       \r
+       bool audio_ready2() const\r
        {\r
-               return audio_streams_.back().size() / format_desc_.audio_samples_per_frame;\r
+               switch(display_mode_)\r
+               {\r
+               case display_mode::duplicate:                                   \r
+                       return audio_streams_.front().size()/2 >= format_desc_.audio_samples_per_frame;\r
+               default:                                                                                \r
+                       return audio_streams_.front().size() >= format_desc_.audio_samples_per_frame;\r
+               }\r
        }\r
-       \r
+               \r
        void commit()\r
        {\r
-               if(video_streams_.size() > 1 && audio_streams_.size() > 1 &&\r
-                       (video_streams_.front().empty() || audio_streams_.front().empty()))\r
+               if(video_streams_.size() > 1 && audio_streams_.size() > 1 && (!video_ready2() || !audio_ready2()))\r
                {\r
                        if(!video_streams_.front().empty() || !audio_streams_.front().empty())\r
                                CASPAR_LOG(debug) << "Truncating: " << video_streams_.front().size() << L" video-frames, " << audio_streams_.front().size() << L" audio-samples.";\r
@@ -294,7 +333,7 @@ struct frame_muxer::implementation : boost::noncopyable
                        audio_streams_.pop_front();\r
                }\r
 \r
-               if(video_streams_.front().empty() || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
+               if(!video_ready2() || !audio_ready2())\r
                        return;\r
                \r
                switch(display_mode_)\r
@@ -309,12 +348,9 @@ struct frame_muxer::implementation : boost::noncopyable
                default:                                                                                BOOST_THROW_EXCEPTION(invalid_operation() << msg_info("invalid display-mode"));\r
                }\r
        }\r
-\r
+       \r
        void simple(std::deque<safe_ptr<basic_frame>>& dest)\r
-       {\r
-               if(video_streams_.front().empty() || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
-                       return;\r
-               \r
+       {               \r
                auto frame1 = pop_video();\r
                frame1->audio_data() = pop_audio();\r
 \r
@@ -323,9 +359,6 @@ struct frame_muxer::implementation : boost::noncopyable
 \r
        void duplicate(std::deque<safe_ptr<basic_frame>>& dest)\r
        {               \r
-               if(video_streams_.front().empty() || audio_streams_.front().size()/2 < format_desc_.audio_samples_per_frame)\r
-                       return;\r
-\r
                auto frame = pop_video();\r
 \r
                auto frame1 = make_safe<core::write_frame>(*frame); // make a copy\r
@@ -339,10 +372,7 @@ struct frame_muxer::implementation : boost::noncopyable
        }\r
 \r
        void half(std::deque<safe_ptr<basic_frame>>& dest)\r
-       {       \r
-               if(video_streams_.front().size() < 2 || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
-                       return;\r
-                                               \r
+       {                                                       \r
                auto frame1 = pop_video();\r
                frame1->audio_data() = pop_audio();\r
                                \r
@@ -352,28 +382,41 @@ struct frame_muxer::implementation : boost::noncopyable
        }\r
        \r
        void interlace(std::deque<safe_ptr<basic_frame>>& dest)\r
-       {               \r
-               if(video_streams_.front().size() < 2 || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
-                       return;\r
-               \r
+       {                               \r
                auto frame1 = pop_video();\r
                frame1->audio_data() = pop_audio();\r
                                \r
                auto frame2 = pop_video();\r
 \r
-               dest.push_back(core::basic_frame::interlace(frame1, frame2, format_desc_.mode));                \r
+               dest.push_back(core::basic_frame::interlace(frame1, frame2, format_desc_.field_mode));          \r
+       }\r
+       \r
+       int64_t calc_nb_frames(int64_t nb_frames) const\r
+       {\r
+               switch(display_mode_)\r
+               {\r
+               case display_mode::interlace:\r
+               case display_mode::half:\r
+                       return nb_frames/2;\r
+               case display_mode::duplicate:\r
+               case display_mode::deinterlace_bob:\r
+                       return nb_frames*2;\r
+               default:\r
+                       return nb_frames;\r
+               }\r
        }\r
 };\r
 \r
 frame_muxer::frame_muxer(double in_fps, const safe_ptr<core::frame_factory>& frame_factory)\r
        : impl_(new implementation(in_fps, frame_factory)){}\r
 void frame_muxer::push(const std::shared_ptr<AVFrame>& video_frame, int hints){impl_->push(video_frame, hints);}\r
-void frame_muxer::push(const std::shared_ptr<std::vector<int16_t>>& audio_samples){return impl_->push(audio_samples);}\r
+void frame_muxer::push(const std::shared_ptr<std::vector<int32_t>>& audio_samples){return impl_->push(audio_samples);}\r
 void frame_muxer::commit(){impl_->commit();}\r
 safe_ptr<basic_frame> frame_muxer::pop(){return impl_->pop();}\r
 size_t frame_muxer::size() const {return impl_->size();}\r
 bool frame_muxer::empty() const {return impl_->size() == 0;}\r
 bool frame_muxer::video_ready() const{return impl_->video_ready();}\r
 bool frame_muxer::audio_ready() const{return impl_->audio_ready();}\r
+int64_t frame_muxer::calc_nb_frames(int64_t nb_frames) const {return impl_->calc_nb_frames(nb_frames);}\r
 \r
 }
\ No newline at end of file