// Source: git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/muxer/frame_muxer.cpp
// 2.0.2: Merged ntsc-audio-exp branch for proper/native NTSC audio support.
// [casparcg] / modules / ffmpeg / producer / muxer / frame_muxer.cpp
1 #include "../../StdAfx.h"\r
2 \r
3 #include "frame_muxer.h"\r
4 \r
5 #include "display_mode.h"\r
6 \r
7 #include "../filter/filter.h"\r
8 #include "../util/util.h"\r
9 \r
10 #include <core/producer/frame_producer.h>\r
11 #include <core/producer/frame/basic_frame.h>\r
12 #include <core/producer/frame/frame_transform.h>\r
13 #include <core/producer/frame/pixel_format.h>\r
14 #include <core/producer/frame/frame_factory.h>\r
15 #include <core/mixer/write_frame.h>\r
16 \r
17 #include <common/env.h>\r
18 #include <common/exception/exceptions.h>\r
19 #include <common/log/log.h>\r
20 \r
21 #if defined(_MSC_VER)\r
22 #pragma warning (push)\r
23 #pragma warning (disable : 4244)\r
24 #endif\r
25 extern "C" \r
26 {\r
27         #define __STDC_CONSTANT_MACROS\r
28         #define __STDC_LIMIT_MACROS\r
29         #include <libavcodec/avcodec.h>\r
30         #include <libavformat/avformat.h>\r
31 }\r
32 #if defined(_MSC_VER)\r
33 #pragma warning (pop)\r
34 #endif\r
35 \r
36 #include <boost/foreach.hpp>\r
37 #include <boost/range/algorithm_ext/push_back.hpp>\r
38 \r
39 #include <deque>\r
40 #include <queue>\r
41 #include <vector>\r
42 \r
43 using namespace caspar::core;\r
44 \r
45 namespace caspar { namespace ffmpeg {\r
46         \r
47 struct frame_muxer::implementation : boost::noncopyable\r
48 {       \r
49         std::queue<std::queue<safe_ptr<write_frame>>>   video_streams_;\r
50         std::queue<core::audio_buffer>                                  audio_streams_;\r
51         std::queue<safe_ptr<basic_frame>>                               frame_buffer_;\r
52         display_mode::type                                                              display_mode_;\r
53         const double                                                                    in_fps_;\r
54         const video_format_desc                                                 format_desc_;\r
55         bool                                                                                    auto_transcode_;\r
56         \r
57         std::vector<size_t>                                                             audio_cadence_;\r
58 \r
59         size_t                                                                                  audio_sample_count_;\r
60         size_t                                                                                  video_frame_count_;\r
61                 \r
62         safe_ptr<core::frame_factory>                                   frame_factory_;\r
63         \r
64         filter                                                                                  filter_;\r
65         std::wstring                                                                    filter_str_;\r
66                 \r
67         implementation(double in_fps, const safe_ptr<core::frame_factory>& frame_factory, const std::wstring& filter_str)\r
68                 : display_mode_(display_mode::invalid)\r
69                 , in_fps_(in_fps)\r
70                 , format_desc_(frame_factory->get_video_format_desc())\r
71                 , auto_transcode_(env::properties().get("configuration.auto-transcode", true))\r
72                 , audio_cadence_(format_desc_.audio_cadence)\r
73                 , audio_sample_count_(0)\r
74                 , video_frame_count_(0)\r
75                 , frame_factory_(frame_factory)\r
76                 , filter_str_(filter_str)\r
77         {\r
78                 video_streams_.push(std::queue<safe_ptr<write_frame>>());\r
79                 audio_streams_.push(core::audio_buffer());\r
80                 boost::range::sort(audio_cadence_);\r
81                 boost::range::reverse(audio_cadence_);\r
82         }\r
83 \r
84         void push(const std::shared_ptr<AVFrame>& video_frame, int hints)\r
85         {               \r
86                 if(!video_frame)\r
87                         return;\r
88                 \r
89                 if(video_frame == flush_video())\r
90                 {       \r
91                         video_frame_count_ = 0;\r
92                         video_streams_.push(std::queue<safe_ptr<write_frame>>());\r
93                 }\r
94                 else if(video_frame == empty_video())\r
95                 {\r
96                         video_streams_.back().push(make_safe<core::write_frame>(this));\r
97                         ++video_frame_count_;\r
98                         display_mode_ = display_mode::simple;\r
99                 }\r
100                 else\r
101                 {\r
102                         if(display_mode_ == display_mode::invalid)\r
103                                 initialize_display_mode(*video_frame);\r
104                                 \r
105                         if(hints & core::frame_producer::ALPHA_HINT)\r
106                                 video_frame->format = make_alpha_format(video_frame->format);\r
107                 \r
108                         auto format = video_frame->format;\r
109                         if(video_frame->format == CASPAR_PIX_FMT_LUMA) // CASPAR_PIX_FMT_LUMA is not valid for filter, change it to GRAY8\r
110                                 video_frame->format = PIX_FMT_GRAY8;\r
111 \r
112                         filter_.push(video_frame);\r
113                         BOOST_FOREACH(auto& av_frame, filter_.poll_all())\r
114                         {\r
115                                 if(video_frame->format == PIX_FMT_GRAY8 && format == CASPAR_PIX_FMT_LUMA)\r
116                                         av_frame->format = format;\r
117 \r
118                                 video_streams_.back().push(make_write_frame(this, av_frame, frame_factory_, hints));\r
119                                 ++video_frame_count_;\r
120                         }\r
121                 }\r
122 \r
123                 if(video_streams_.back().size() > 32)\r
124                         BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("video-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
125         }\r
126 \r
127         void push(const std::shared_ptr<core::audio_buffer>& audio)\r
128         {\r
129                 if(!audio)      \r
130                         return;\r
131 \r
132                 if(audio == flush_audio())\r
133                 {\r
134                         audio_sample_count_ = 0;\r
135                         audio_streams_.push(core::audio_buffer());\r
136                 }\r
137                 else if(audio == empty_audio())\r
138                 {\r
139                         boost::range::push_back(audio_streams_.back(), core::audio_buffer(audio_cadence_.front(), 0));\r
140                         audio_sample_count_ += audio->size();\r
141                 }\r
142                 else\r
143                 {\r
144                         boost::range::push_back(audio_streams_.back(), *audio);\r
145                         audio_sample_count_ += audio->size();\r
146                 }\r
147 \r
148                 if(audio_streams_.back().size() > 32*audio_cadence_.front())\r
149                         BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("audio-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
150         }\r
151         \r
152         bool video_ready() const\r
153         {               \r
154                 return video_streams_.size() > 1 || (video_streams_.size() >= audio_streams_.size() && video_ready2());\r
155         }\r
156         \r
157         bool audio_ready() const\r
158         {\r
159                 return audio_streams_.size() > 1 || (audio_streams_.size() >= video_streams_.size() && audio_ready2());\r
160         }\r
161 \r
162         bool video_ready2() const\r
163         {               \r
164                 switch(display_mode_)\r
165                 {\r
166                 case display_mode::deinterlace_bob_reinterlace:                                 \r
167                 case display_mode::interlace:   \r
168                 case display_mode::half:\r
169                         return video_streams_.front().size() >= 2;\r
170                 default:                                                                                \r
171                         return video_streams_.front().size() >= 1;\r
172                 }\r
173         }\r
174         \r
175         bool audio_ready2() const\r
176         {\r
177                 switch(display_mode_)\r
178                 {\r
179                 case display_mode::duplicate:                                   \r
180                         return audio_streams_.front().size()/2 >= audio_cadence_.front();\r
181                 default:                                                                                \r
182                         return audio_streams_.front().size() >= audio_cadence_.front();\r
183                 }\r
184         }\r
185                 \r
186         std::shared_ptr<basic_frame> poll()\r
187         {\r
188                 if(!frame_buffer_.empty())\r
189                 {\r
190                         auto frame = frame_buffer_.front();\r
191                         frame_buffer_.pop();    \r
192                         return frame;\r
193                 }\r
194 \r
195                 if(video_streams_.size() > 1 && audio_streams_.size() > 1 && (!video_ready2() || !audio_ready2()))\r
196                 {\r
197                         if(!video_streams_.front().empty() || !audio_streams_.front().empty())\r
198                                 CASPAR_LOG(debug) << "Truncating: " << video_streams_.front().size() << L" video-frames, " << audio_streams_.front().size() << L" audio-samples.";\r
199 \r
200                         video_streams_.pop();\r
201                         audio_streams_.pop();\r
202                 }\r
203 \r
204                 if(!video_ready2() || !audio_ready2())\r
205                         return nullptr;\r
206                                 \r
207                 auto frame1                             = pop_video();\r
208                 frame1->audio_data()    = pop_audio();\r
209 \r
210                 switch(display_mode_)\r
211                 {\r
212                 case display_mode::simple:                                              \r
213                 case display_mode::deinterlace_bob:                             \r
214                 case display_mode::deinterlace: \r
215                 {\r
216                         frame_buffer_.push(frame1);\r
217                         break;\r
218                 }\r
219                 case display_mode::interlace:                                   \r
220                 case display_mode::deinterlace_bob_reinterlace: \r
221                 {                               \r
222                         auto frame2 = pop_video();\r
223 \r
224                         frame_buffer_.push(core::basic_frame::interlace(frame1, frame2, format_desc_.field_mode));      \r
225                         break;\r
226                 }\r
227                 case display_mode::duplicate:   \r
228                 {\r
229                         auto frame2                             = make_safe<core::write_frame>(*frame1);\r
230                         frame2->audio_data()    = pop_audio();\r
231 \r
232                         frame_buffer_.push(frame1);\r
233                         frame_buffer_.push(frame2);\r
234                         break;\r
235                 }\r
236                 case display_mode::half:        \r
237                 {                               \r
238                         pop_video(); // Throw away\r
239 \r
240                         frame_buffer_.push(frame1);\r
241                         break;\r
242                 }\r
243                 default:                                                                                \r
244                         BOOST_THROW_EXCEPTION(invalid_operation() << msg_info("invalid display-mode"));\r
245                 }\r
246                 \r
247                 return frame_buffer_.empty() ? nullptr : poll();\r
248         }\r
249         \r
250         safe_ptr<core::write_frame> pop_video()\r
251         {\r
252                 auto frame = video_streams_.front().front();\r
253                 video_streams_.front().pop();           \r
254                 return frame;\r
255         }\r
256 \r
257         core::audio_buffer pop_audio()\r
258         {\r
259                 CASPAR_VERIFY(audio_streams_.front().size() >= audio_cadence_.front());\r
260 \r
261                 auto begin = audio_streams_.front().begin();\r
262                 auto end   = begin + audio_cadence_.front();\r
263 \r
264                 core::audio_buffer samples(begin, end);\r
265                 audio_streams_.front().erase(begin, end);\r
266                 \r
267                 boost::range::rotate(audio_cadence_, std::begin(audio_cadence_)+1);\r
268 \r
269                 return samples;\r
270         }\r
271                                 \r
272         void initialize_display_mode(const AVFrame& frame)\r
273         {\r
274                 display_mode_ = display_mode::simple;\r
275                 if(auto_transcode_)\r
276                 {\r
277                         auto mode = get_mode(frame);\r
278                         auto fps  = in_fps_;\r
279 \r
280                         if(is_deinterlacing(filter_str_))\r
281                                 mode = core::field_mode::progressive;\r
282 \r
283                         if(is_double_rate(filter_str_))\r
284                                 fps *= 2;\r
285                         \r
286                         display_mode_ = get_display_mode(mode, fps, format_desc_.field_mode, format_desc_.fps);\r
287                         \r
288                         if((frame.height != 480 || format_desc_.height != 486) && \r
289                                 display_mode_ == display_mode::simple && mode != core::field_mode::progressive && format_desc_.field_mode != core::field_mode::progressive && \r
290                                 frame.height != static_cast<int>(format_desc_.height))\r
291                         {\r
292                                 display_mode_ = display_mode::deinterlace_bob_reinterlace; // The frame will most likely be scaled, we need to deinterlace->reinterlace \r
293                         }\r
294 \r
295                         if(display_mode_ == display_mode::deinterlace)\r
296                                 filter_str_ = append_filter(filter_str_, L"YADIF=0:-1");\r
297                         else if(display_mode_ == display_mode::deinterlace_bob || display_mode_ == display_mode::deinterlace_bob_reinterlace)\r
298                                 filter_str_ = append_filter(filter_str_, L"YADIF=1:-1");\r
299                 }\r
300 \r
301                 if(display_mode_ == display_mode::invalid)\r
302                 {\r
303                         CASPAR_LOG(warning) << L"[frame_muxer] Auto-transcode: Failed to detect display-mode.";\r
304                         display_mode_ = display_mode::simple;\r
305                 }\r
306                         \r
307                 filter_ = filter(filter_str_);\r
308 \r
309                 CASPAR_LOG(info) << "[frame_muxer] " << display_mode::print(display_mode_) \r
310                         << L" " << frame.width << L"x" << frame.height \r
311                         << (frame.interlaced_frame ? L"i" : L"p") \r
312                         << (frame.interlaced_frame ? in_fps_*2 : in_fps_);\r
313         }\r
314 \r
315         int64_t calc_nb_frames(int64_t nb_frames) const\r
316         {\r
317                 switch(display_mode_) // Take into account transformation in run.\r
318                 {\r
319                 case display_mode::deinterlace_bob_reinterlace:\r
320                 case display_mode::interlace:   \r
321                 case display_mode::half:\r
322                         nb_frames /= 2;\r
323                         break;\r
324                 case display_mode::duplicate:\r
325                         nb_frames *= 2;\r
326                         break;\r
327                 }\r
328 \r
329                 if(is_double_rate(widen(filter_.filter_str()))) // Take into account transformations in filter.\r
330                         nb_frames *= 2;\r
331 \r
332                 return nb_frames;\r
333         }\r
334 };\r
335 \r
336 frame_muxer::frame_muxer(double in_fps, const safe_ptr<core::frame_factory>& frame_factory, const std::wstring& filter)\r
337         : impl_(new implementation(in_fps, frame_factory, filter)){}\r
338 void frame_muxer::push(const std::shared_ptr<AVFrame>& video_frame, int hints){impl_->push(video_frame, hints);}\r
339 void frame_muxer::push(const std::shared_ptr<core::audio_buffer>& audio_samples){return impl_->push(audio_samples);}\r
340 std::shared_ptr<basic_frame> frame_muxer::poll(){return impl_->poll();}\r
341 int64_t frame_muxer::calc_nb_frames(int64_t nb_frames) const {return impl_->calc_nb_frames(nb_frames);}\r
342 bool frame_muxer::video_ready() const{return impl_->video_ready();}\r
343 bool frame_muxer::audio_ready() const{return impl_->audio_ready();}\r
344 \r
345 }}