]> git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/frame_muxer.cpp
affb1c329c6469e4270228f6e73075b0a004ded5
[casparcg] / modules / ffmpeg / producer / frame_muxer.cpp
1 #include "../StdAfx.h"\r
2 \r
3 #include "frame_muxer.h"\r
4 \r
5 #include "filter/filter.h"\r
6 \r
7 #include "util.h"\r
8 \r
9 #include <core/producer/frame_producer.h>\r
10 #include <core/producer/frame/basic_frame.h>\r
11 #include <core/producer/frame/frame_transform.h>\r
12 #include <core/producer/frame/pixel_format.h>\r
13 #include <core/producer/frame/frame_factory.h>\r
14 #include <core/mixer/write_frame.h>\r
15 \r
16 #include <common/env.h>\r
17 #include <common/exception/exceptions.h>\r
18 #include <common/log/log.h>\r
19 \r
20 #if defined(_MSC_VER)\r
21 #pragma warning (push)\r
22 #pragma warning (disable : 4244)\r
23 #endif\r
24 extern "C" \r
25 {\r
26         #define __STDC_CONSTANT_MACROS\r
27         #define __STDC_LIMIT_MACROS\r
28         #include <libavcodec/avcodec.h>\r
29         #include <libavformat/avformat.h>\r
30 }\r
31 #if defined(_MSC_VER)\r
32 #pragma warning (pop)\r
33 #endif\r
34 \r
35 #include <boost/foreach.hpp>\r
36 #include <boost/range/algorithm_ext/push_back.hpp>\r
37 \r
38 #include <deque>\r
39 #include <queue>\r
40 #include <vector>\r
41 \r
42 using namespace caspar::core;\r
43 \r
44 namespace caspar {\r
45 \r
/// Enumerates the strategies the muxer can use to turn decoded input frames
/// into output frames, plus a helper that names them for logging.
struct display_mode
{
    enum type
    {
        simple,
        duplicate,
        half,
        interlace,
        deinterlace_bob,
        deinterlace_bob_reinterlace,
        deinterlace,
        count,   // Number of real modes; not a mode itself.
        invalid
    };

    /// Returns the textual name of `value`.
    ///
    /// Every enumerator before `count` maps to its own identifier; `count`,
    /// `invalid` and anything else map to L"invalid".
    static std::wstring print(display_mode::type value)
    {
        // Indexed by enumerator value: must stay in declaration order and
        // contain exactly one entry per enumerator that precedes `count`.
        static const wchar_t* const names[] =
        {
            L"simple",
            L"duplicate",
            L"half",
            L"interlace",
            L"deinterlace_bob",
            L"deinterlace_bob_reinterlace",
            L"deinterlace"
        };

        const int index = static_cast<int>(value);
        if(index < static_cast<int>(simple) || index >= static_cast<int>(count))
            return L"invalid";

        return names[index];
    }
};
84 \r
85 display_mode::type get_display_mode(const core::field_mode::type in_mode, double in_fps, const core::field_mode::type out_mode, double out_fps)\r
86 {               \r
87         static const auto epsilon = 2.0;\r
88 \r
89         if(in_fps < 20.0 || in_fps > 80.0)\r
90         {\r
91                 //if(out_mode != core::field_mode::progressive && in_mode == core::field_mode::progressive)\r
92                 //      return display_mode::interlace;\r
93                 \r
94                 if(out_mode == core::field_mode::progressive && in_mode != core::field_mode::progressive)\r
95                 {\r
96                         if(in_fps < 35.0)\r
97                                 return display_mode::deinterlace;\r
98                         else\r
99                                 return display_mode::deinterlace_bob;\r
100                 }\r
101         }\r
102 \r
103         if(std::abs(in_fps - out_fps) < epsilon)\r
104         {\r
105                 if(in_mode != core::field_mode::progressive && out_mode == core::field_mode::progressive)\r
106                         return display_mode::deinterlace;\r
107                 //else if(in_mode == core::field_mode::progressive && out_mode != core::field_mode::progressive)\r
108                 //      simple(); // interlace_duplicate();\r
109                 else\r
110                         return display_mode::simple;\r
111         }\r
112         else if(std::abs(in_fps/2.0 - out_fps) < epsilon)\r
113         {\r
114                 if(in_mode != core::field_mode::progressive)\r
115                         return display_mode::invalid;\r
116 \r
117                 if(out_mode != core::field_mode::progressive)\r
118                         return display_mode::interlace;\r
119                 else\r
120                         return display_mode::half;\r
121         }\r
122         else if(std::abs(in_fps - out_fps/2.0) < epsilon)\r
123         {\r
124                 if(out_mode != core::field_mode::progressive)\r
125                         return display_mode::invalid;\r
126 \r
127                 if(in_mode != core::field_mode::progressive)\r
128                         return display_mode::deinterlace_bob;\r
129                 else\r
130                         return display_mode::duplicate;\r
131         }\r
132 \r
133         return display_mode::invalid;\r
134 }\r
135 \r
136 struct frame_muxer::implementation : boost::noncopyable\r
137 {       \r
138         std::deque<std::queue<safe_ptr<write_frame>>>   video_streams_;\r
139         std::deque<std::vector<int32_t>>                                audio_streams_;\r
140         std::deque<safe_ptr<basic_frame>>                               frame_buffer_;\r
141         display_mode::type                                                              display_mode_;\r
142         const double                                                                    in_fps_;\r
143         const video_format_desc                                                 format_desc_;\r
144         bool                                                                                    auto_transcode_;\r
145 \r
146         size_t                                                                                  audio_sample_count_;\r
147         size_t                                                                                  video_frame_count_;\r
148                 \r
149         size_t                                                                                  processed_audio_sample_count_;\r
150         size_t                                                                                  processed_video_frame_count_;\r
151 \r
152         filter                                                                                  filter_;\r
153         safe_ptr<core::frame_factory>                                   frame_factory_;\r
154                 \r
155         implementation(double in_fps, const safe_ptr<core::frame_factory>& frame_factory)\r
156                 : video_streams_(1)\r
157                 , audio_streams_(1)\r
158                 , display_mode_(display_mode::invalid)\r
159                 , in_fps_(in_fps)\r
160                 , format_desc_(frame_factory->get_video_format_desc())\r
161                 , auto_transcode_(env::properties().get("configuration.producers.auto-transcode", false))\r
162                 , audio_sample_count_(0)\r
163                 , video_frame_count_(0)\r
164                 , frame_factory_(frame_factory)\r
165         {\r
166         }\r
167 \r
168         void push(const std::shared_ptr<AVFrame>& video_frame, int hints)\r
169         {               \r
170                 if(!video_frame)\r
171                 {       \r
172                         CASPAR_LOG(debug) << L"video-frame-count: " << static_cast<float>(video_frame_count_);\r
173                         video_frame_count_ = 0;\r
174                         video_streams_.push_back(std::queue<safe_ptr<write_frame>>());\r
175                         return;\r
176                 }\r
177 \r
178                 if(video_frame->data[0] == nullptr)\r
179                 {\r
180                         video_streams_.back().push(make_safe<core::write_frame>(this));\r
181                         ++video_frame_count_;\r
182                         display_mode_ = display_mode::simple;\r
183                         return;\r
184                 }\r
185 \r
186                 if(display_mode_ == display_mode::invalid)\r
187                 {\r
188                         if(auto_transcode_)\r
189                         {\r
190                                 auto in_mode = get_mode(*video_frame);\r
191                                 display_mode_ = get_display_mode(in_mode, in_fps_, format_desc_.field_mode, format_desc_.fps);\r
192                         \r
193                                 if(display_mode_ == display_mode::simple && in_mode != core::field_mode::progressive && format_desc_.field_mode != core::field_mode::progressive && video_frame->height != static_cast<int>(format_desc_.height))\r
194                                         display_mode_ = display_mode::deinterlace_bob_reinterlace; // The frame will most likely be scaled, we need to deinterlace->reinterlace \r
195                                 \r
196                                 if(display_mode_ == display_mode::deinterlace)\r
197                                         filter_ = filter(L"YADIF=0:-1");\r
198                                 else if(display_mode_ == display_mode::deinterlace_bob || display_mode_ == display_mode::deinterlace_bob_reinterlace)\r
199                                         filter_ = filter(L"YADIF=1:-1");\r
200                         }\r
201                         else\r
202                                 display_mode_ = display_mode::simple;\r
203 \r
204                         if(display_mode_ == display_mode::invalid)\r
205                         {\r
206                                 CASPAR_LOG(warning) << L"[frame_muxer] Failed to detect display-mode.";\r
207                                 display_mode_ = display_mode::simple;\r
208                         }\r
209 \r
210                         CASPAR_LOG(info) << "[frame_muxer] " << display_mode::print(display_mode_);\r
211                 }\r
212 \r
213                                 \r
214                 if(hints & core::frame_producer::ALPHA_HINT)\r
215                         video_frame->format = make_alpha_format(video_frame->format);\r
216                 \r
217                 auto format = video_frame->format;\r
218                 if(video_frame->format == CASPAR_PIX_FMT_LUMA) // CASPAR_PIX_FMT_LUMA is not valid for filter, change it to GRAY8\r
219                         video_frame->format = PIX_FMT_GRAY8;\r
220 \r
221                 BOOST_FOREACH(auto& av_frame, filter_.execute(video_frame))\r
222                 {\r
223                         av_frame->format = format;\r
224 \r
225                         auto frame = make_write_frame(this, av_frame, frame_factory_, hints);\r
226 \r
227                         // Fix field-order if needed\r
228                         if(frame->get_type() == core::field_mode::lower && format_desc_.field_mode == core::field_mode::upper)\r
229                                 frame->get_frame_transform().fill_translation[1] += 1.0/static_cast<double>(format_desc_.height);\r
230                         else if(frame->get_type() == core::field_mode::upper && format_desc_.field_mode == core::field_mode::lower)\r
231                                 frame->get_frame_transform().fill_translation[1] -= 1.0/static_cast<double>(format_desc_.height);\r
232 \r
233                         video_streams_.back().push(frame);\r
234                         ++video_frame_count_;\r
235                 }\r
236 \r
237                 if(video_streams_.back().size() > 8)\r
238                         BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("video-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
239         }\r
240 \r
241         void push(const std::shared_ptr<std::vector<int32_t>>& audio_samples)\r
242         {\r
243                 if(!audio_samples)      \r
244                 {\r
245                         CASPAR_LOG(debug) << L"audio-chunk-count: " << audio_sample_count_/format_desc_.audio_samples_per_frame;\r
246                         audio_streams_.push_back(std::vector<int32_t>());\r
247                         audio_sample_count_ = 0;\r
248                         return;\r
249                 }\r
250 \r
251                 audio_sample_count_ += audio_samples->size();\r
252 \r
253                 boost::range::push_back(audio_streams_.back(), *audio_samples);\r
254 \r
255                 if(audio_streams_.back().size() > 8*format_desc_.audio_samples_per_frame)\r
256                         BOOST_THROW_EXCEPTION(invalid_operation() << source_info("frame_muxer") << msg_info("audio-stream overflow. This can be caused by incorrect frame-rate. Check clip meta-data."));\r
257         }\r
258 \r
259         safe_ptr<basic_frame> pop()\r
260         {               \r
261                 auto frame = frame_buffer_.front();\r
262                 frame_buffer_.pop_front();              \r
263                 return frame;\r
264         }\r
265 \r
266         size_t size() const\r
267         {\r
268                 return frame_buffer_.size();\r
269         }\r
270 \r
271         safe_ptr<core::write_frame> pop_video()\r
272         {\r
273                 auto frame = video_streams_.front().front();\r
274                 video_streams_.front().pop();\r
275                 \r
276                 return frame;\r
277         }\r
278 \r
279         std::vector<int32_t> pop_audio()\r
280         {\r
281                 CASPAR_VERIFY(audio_streams_.front().size() >= format_desc_.audio_samples_per_frame);\r
282 \r
283                 auto begin = audio_streams_.front().begin();\r
284                 auto end   = begin + format_desc_.audio_samples_per_frame;\r
285 \r
286                 auto samples = std::vector<int32_t>(begin, end);\r
287                 audio_streams_.front().erase(begin, end);\r
288 \r
289                 return samples;\r
290         }\r
291         \r
292         bool video_ready() const\r
293         {               \r
294                 return video_streams_.size() > 1 || (video_streams_.size() >= audio_streams_.size() && video_ready2());\r
295         }\r
296         \r
297         bool audio_ready() const\r
298         {\r
299                 return audio_streams_.size() > 1 || (audio_streams_.size() >= video_streams_.size() && audio_ready2());\r
300         }\r
301 \r
302         bool video_ready2() const\r
303         {               \r
304                 switch(display_mode_)\r
305                 {\r
306                 case display_mode::deinterlace_bob_reinterlace:                                 \r
307                 case display_mode::interlace:                                   \r
308                         return video_streams_.front().size() >= 2;\r
309                 default:                                                                                \r
310                         return !video_streams_.front().empty();\r
311                 }\r
312         }\r
313         \r
314         bool audio_ready2() const\r
315         {\r
316                 switch(display_mode_)\r
317                 {\r
318                 case display_mode::duplicate:                                   \r
319                         return audio_streams_.front().size()/2 >= format_desc_.audio_samples_per_frame;\r
320                 default:                                                                                \r
321                         return audio_streams_.front().size() >= format_desc_.audio_samples_per_frame;\r
322                 }\r
323         }\r
324                 \r
325         void commit()\r
326         {\r
327                 if(video_streams_.size() > 1 && audio_streams_.size() > 1 && (!video_ready2() || !audio_ready2()))\r
328                 {\r
329                         if(!video_streams_.front().empty() || !audio_streams_.front().empty())\r
330                                 CASPAR_LOG(debug) << "Truncating: " << video_streams_.front().size() << L" video-frames, " << audio_streams_.front().size() << L" audio-samples.";\r
331 \r
332                         video_streams_.pop_front();\r
333                         audio_streams_.pop_front();\r
334                 }\r
335 \r
336                 if(!video_ready2() || !audio_ready2())\r
337                         return;\r
338                 \r
339                 switch(display_mode_)\r
340                 {\r
341                 case display_mode::simple:                                              return simple(frame_buffer_);\r
342                 case display_mode::duplicate:                                   return duplicate(frame_buffer_);\r
343                 case display_mode::half:                                                return half(frame_buffer_);\r
344                 case display_mode::interlace:                                   return interlace(frame_buffer_);\r
345                 case display_mode::deinterlace_bob:                             return simple(frame_buffer_);\r
346                 case display_mode::deinterlace_bob_reinterlace: return interlace(frame_buffer_);\r
347                 case display_mode::deinterlace:                                 return simple(frame_buffer_);\r
348                 default:                                                                                BOOST_THROW_EXCEPTION(invalid_operation() << msg_info("invalid display-mode"));\r
349                 }\r
350         }\r
351         \r
352         void simple(std::deque<safe_ptr<basic_frame>>& dest)\r
353         {               \r
354                 auto frame1 = pop_video();\r
355                 frame1->audio_data() = pop_audio();\r
356 \r
357                 dest.push_back(frame1);         \r
358         }\r
359 \r
360         void duplicate(std::deque<safe_ptr<basic_frame>>& dest)\r
361         {               \r
362                 auto frame = pop_video();\r
363 \r
364                 auto frame1 = make_safe<core::write_frame>(*frame); // make a copy\r
365                 frame1->audio_data() = pop_audio();\r
366 \r
367                 auto frame2 = frame;\r
368                 frame2->audio_data() = pop_audio();\r
369 \r
370                 dest.push_back(frame1);\r
371                 dest.push_back(frame2);\r
372         }\r
373 \r
374         void half(std::deque<safe_ptr<basic_frame>>& dest)\r
375         {                                                       \r
376                 auto frame1 = pop_video();\r
377                 frame1->audio_data() = pop_audio();\r
378                                 \r
379                 video_streams_.front().pop(); // Throw away\r
380 \r
381                 dest.push_back(frame1);\r
382         }\r
383         \r
384         void interlace(std::deque<safe_ptr<basic_frame>>& dest)\r
385         {                               \r
386                 auto frame1 = pop_video();\r
387                 frame1->audio_data() = pop_audio();\r
388                                 \r
389                 auto frame2 = pop_video();\r
390 \r
391                 dest.push_back(core::basic_frame::interlace(frame1, frame2, format_desc_.field_mode));          \r
392         }\r
393         \r
394         int64_t calc_nb_frames(int64_t nb_frames) const\r
395         {\r
396                 switch(display_mode_)\r
397                 {\r
398                 case display_mode::interlace:\r
399                 case display_mode::half:\r
400                         return nb_frames/2;\r
401                 case display_mode::duplicate:\r
402                 case display_mode::deinterlace_bob:\r
403                         return nb_frames*2;\r
404                 default:\r
405                         return nb_frames;\r
406                 }\r
407         }\r
408 };\r
409 \r
410 frame_muxer::frame_muxer(double in_fps, const safe_ptr<core::frame_factory>& frame_factory)\r
411         : impl_(new implementation(in_fps, frame_factory)){}\r
412 void frame_muxer::push(const std::shared_ptr<AVFrame>& video_frame, int hints){impl_->push(video_frame, hints);}\r
413 void frame_muxer::push(const std::shared_ptr<std::vector<int32_t>>& audio_samples){return impl_->push(audio_samples);}\r
414 void frame_muxer::commit(){impl_->commit();}\r
415 safe_ptr<basic_frame> frame_muxer::pop(){return impl_->pop();}\r
416 size_t frame_muxer::size() const {return impl_->size();}\r
417 bool frame_muxer::empty() const {return impl_->size() == 0;}\r
418 bool frame_muxer::video_ready() const{return impl_->video_ready();}\r
419 bool frame_muxer::audio_ready() const{return impl_->audio_ready();}\r
420 int64_t frame_muxer::calc_nb_frames(int64_t nb_frames) const {return impl_->calc_nb_frames(nb_frames);}\r
421 \r
422 }