]> git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/frame_muxer.cpp
git-svn-id: https://casparcg.svn.sourceforge.net/svnroot/casparcg/server/branches...
[casparcg] / modules / ffmpeg / producer / frame_muxer.cpp
1 #include "../StdAfx.h"\r
2 \r
3 #include "frame_muxer.h"\r
4 \r
5 #include "filter/filter.h"\r
6 \r
7 #include "util.h"\r
8 \r
9 #include <core/producer/frame/basic_frame.h>\r
10 #include <core/producer/frame/image_transform.h>\r
11 #include <core/producer/frame/pixel_format.h>\r
12 #include <core/producer/frame/frame_factory.h>\r
13 #include <core/mixer/write_frame.h>\r
14 \r
15 #include <common/env.h>\r
16 #include <common/log/log.h>\r
17 \r
18 #include <boost/range/algorithm_ext/push_back.hpp>\r
19 \r
20 using namespace caspar::core;\r
21 \r
22 namespace caspar {\r
23 \r
/// Enumerates the ways decoded video can be adapted to the output format,
/// together with a helper that turns a mode into its textual name.
struct display_mode
{
        enum type
        {
                simple,
                duplicate,
                half,
                interlace,
                deinterlace_bob,
                deinterlace_bob_reinterlace,
                deinterlace,
                count,   // marks the end of the nameable modes
                invalid
        };

        /// Returns the lower-case name of `value`.
        /// Every value outside [simple, count) - including `count` itself -
        /// is reported as L"invalid".
        static std::wstring print(display_mode::type value)
        {
                // Indexed by enumerator value; must stay in the same order as `type`.
                static const wchar_t* const names[] =
                {
                        L"simple",
                        L"duplicate",
                        L"half",
                        L"interlace",
                        L"deinterlace_bob",
                        L"deinterlace_bob_reinterlace",
                        L"deinterlace"
                };

                const int index = static_cast<int>(value);
                if(index < 0 || index >= static_cast<int>(count))
                        return L"invalid";

                return names[index];
        }
};
62 \r
63 display_mode::type get_display_mode(const core::video_mode::type in_mode, double in_fps, const core::video_mode::type out_mode, double out_fps)\r
64 {               \r
65         if(in_mode == core::video_mode::invalid || out_mode == core::video_mode::invalid)\r
66                 return display_mode::invalid;\r
67 \r
68         static const auto epsilon = 2.0;\r
69 \r
70         if(std::abs(in_fps - out_fps) < epsilon)\r
71         {\r
72                 if(in_mode != core::video_mode::progressive && out_mode == core::video_mode::progressive)\r
73                         return display_mode::deinterlace;\r
74                 //else if(in_mode == core::video_mode::progressive && out_mode != core::video_mode::progressive)\r
75                 //      simple(); // interlace_duplicate();\r
76                 else\r
77                         return display_mode::simple;\r
78         }\r
79         else if(std::abs(in_fps/2.0 - out_fps) < epsilon)\r
80         {\r
81                 if(in_mode != core::video_mode::progressive)\r
82                         return display_mode::invalid;\r
83 \r
84                 if(out_mode != core::video_mode::progressive)\r
85                         return display_mode::interlace;\r
86                 else\r
87                         return display_mode::half;\r
88         }\r
89         else if(std::abs(in_fps - out_fps/2.0) < epsilon)\r
90         {\r
91                 if(out_mode != core::video_mode::progressive)\r
92                         return display_mode::invalid;\r
93 \r
94                 if(in_mode != core::video_mode::progressive)\r
95                         return display_mode::deinterlace_bob;\r
96                 else\r
97                         return display_mode::duplicate;\r
98         }\r
99 \r
100         return display_mode::invalid;\r
101 }\r
102 \r
103 struct frame_muxer::implementation : boost::noncopyable\r
104 {       \r
105         std::deque<std::queue<safe_ptr<write_frame>>>   video_streams_;\r
106         std::deque<std::vector<int16_t>>                                audio_streams_;\r
107         std::deque<safe_ptr<basic_frame>>                               frame_buffer_;\r
108         display_mode::type                                                              display_mode_;\r
109         const double                                                                    in_fps_;\r
110         const video_format_desc                                                 format_desc_;\r
111         bool                                                                                    auto_mode_;\r
112 \r
113         size_t                                                                                  audio_sample_count_;\r
114         size_t                                                                                  video_frame_count_;\r
115                 \r
116         size_t                                                                                  processed_audio_sample_count_;\r
117         size_t                                                                                  processed_video_frame_count_;\r
118 \r
119         std::unique_ptr<filter>                                                 filter_;\r
120         safe_ptr<core::frame_factory>                                   frame_factory_;\r
121                 \r
122         implementation(double in_fps, const video_format_desc& format_desc, const safe_ptr<core::frame_factory>& frame_factory)\r
123                 : display_mode_(display_mode::invalid)\r
124                 , in_fps_(in_fps)\r
125                 , format_desc_(format_desc)\r
126                 , auto_mode_(env::properties().get("configuration.auto-mode", false))\r
127                 , audio_sample_count_(0)\r
128                 , video_frame_count_(0)\r
129                 , frame_factory_(frame_factory)\r
130                 , video_streams_(1)\r
131                 , audio_streams_(1)\r
132         {\r
133         }\r
134 \r
135         void push(const std::shared_ptr<AVFrame>& video_frame)\r
136         {               \r
137                 if(!video_frame)\r
138                 {       \r
139                         CASPAR_LOG(debug) << L"video-frame-count: " << static_cast<float>(video_frame_count_);\r
140                         video_frame_count_ = 0;\r
141                         video_streams_.push_back(std::queue<safe_ptr<write_frame>>());\r
142                         return;\r
143                 }\r
144 \r
145                 if(video_frame->data[0] == nullptr)\r
146                 {\r
147                         video_streams_.back().push(make_safe<core::write_frame>(this));\r
148                         ++video_frame_count_;\r
149                         process(frame_buffer_);\r
150                         return;\r
151                 }\r
152                 \r
153                 if(display_mode_ == display_mode::invalid)\r
154                 {\r
155                         auto in_mode = get_mode(*video_frame);\r
156                         display_mode_ = auto_mode_ ? get_display_mode(in_mode, in_fps_, format_desc_.mode, format_desc_.fps) : display_mode::simple;\r
157                         \r
158                         if(display_mode_ == display_mode::simple && in_mode != core::video_mode::progressive && format_desc_.mode != core::video_mode::progressive && video_frame->height != static_cast<int>(format_desc_.height))\r
159                                 display_mode_ = display_mode::deinterlace_bob_reinterlace; // The frame will most likely be scaled, we need to deinterlace->reinterlace         \r
160                 }\r
161                 \r
162                 std::vector<safe_ptr<core::write_frame>> frames;\r
163 \r
164                 if(display_mode_ == display_mode::deinterlace)\r
165                 {\r
166                         if(!filter_)\r
167                                 filter_.reset(new filter(L"YADIF=0:-1"));\r
168 \r
169                         BOOST_FOREACH(auto& frame, filter_->execute(video_frame))\r
170                                 frames.push_back(make_write_frame(this, frame, frame_factory_));\r
171 \r
172                 }\r
173                 else if(display_mode_ == display_mode::deinterlace_bob || display_mode_ == display_mode::deinterlace_bob_reinterlace)\r
174                 {\r
175                         if(!filter_)\r
176                                 filter_.reset(new filter(L"YADIF=1:-1"));\r
177 \r
178                         BOOST_FOREACH(auto& frame, filter_->execute(video_frame))\r
179                                 frames.push_back(make_write_frame(this, frame, frame_factory_));\r
180                 }\r
181                 else\r
182                         frames.push_back(make_write_frame(this, make_safe(video_frame), frame_factory_));\r
183 \r
184                 BOOST_FOREACH(auto& frame, frames)\r
185                 {\r
186                         // Fix field-order if needed\r
187                         if(frame->get_type() == core::video_mode::lower && format_desc_.mode == core::video_mode::upper)\r
188                                 frame->get_image_transform().set_fill_translation(0.0f, 0.5/static_cast<double>(frame->get_pixel_format_desc().planes[0].height));\r
189                         else if(frame->get_type() == core::video_mode::upper && format_desc_.mode == core::video_mode::lower)\r
190                                 frame->get_image_transform().set_fill_translation(0.0f, -0.5/static_cast<double>(frame->get_pixel_format_desc().planes[0].height));\r
191 \r
192                         video_streams_.back().push(frame);\r
193                         ++video_frame_count_;\r
194 \r
195                         process(frame_buffer_);\r
196                 }\r
197         }\r
198 \r
199         void push(const std::shared_ptr<std::vector<int16_t>>& audio_samples)\r
200         {\r
201                 if(!audio_samples)      \r
202                 {\r
203                         CASPAR_LOG(debug) << L"audio-chunk-count: " << audio_sample_count_/format_desc_.audio_samples_per_frame;\r
204                         audio_streams_.push_back(std::vector<int16_t>());\r
205                         audio_sample_count_ = 0;\r
206                         return;\r
207                 }\r
208 \r
209                 audio_sample_count_ += audio_samples->size();\r
210 \r
211                 boost::range::push_back(audio_streams_.back(), *audio_samples);\r
212                 process(frame_buffer_);\r
213         }\r
214 \r
215         safe_ptr<basic_frame> pop()\r
216         {               \r
217                 auto frame = frame_buffer_.front();\r
218                 frame_buffer_.pop_front();              \r
219                 return frame;\r
220         }\r
221 \r
222         size_t size() const\r
223         {\r
224                 return frame_buffer_.size();\r
225         }\r
226 \r
227         safe_ptr<core::write_frame> pop_video()\r
228         {\r
229                 auto frame = video_streams_.front().front();\r
230                 video_streams_.front().pop();\r
231                 \r
232                 return frame;\r
233         }\r
234 \r
235         std::vector<int16_t> pop_audio()\r
236         {\r
237                 CASPAR_VERIFY(audio_streams_.front().size() >= format_desc_.audio_samples_per_frame);\r
238 \r
239                 auto begin = audio_streams_.front().begin();\r
240                 auto end   = begin + format_desc_.audio_samples_per_frame;\r
241 \r
242                 auto samples = std::vector<int16_t>(begin, end);\r
243                 audio_streams_.front().erase(begin, end);\r
244 \r
245                 return samples;\r
246         }\r
247 \r
248         bool video_ready() const\r
249         {\r
250                 return video_frames() > 1 && video_streams_.size() >= audio_streams_.size();\r
251         }\r
252         \r
253         bool audio_ready() const\r
254         {\r
255                 return audio_chunks() > 1 && audio_streams_.size() >= video_streams_.size();\r
256         }\r
257 \r
258         size_t video_frames() const\r
259         {\r
260                 return video_streams_.back().size();\r
261         }\r
262 \r
263         size_t audio_chunks() const\r
264         {\r
265                 return audio_streams_.back().size() / format_desc_.audio_samples_per_frame;\r
266         }\r
267         \r
268         void process(std::deque<safe_ptr<basic_frame>>& dest)\r
269         {\r
270                 if(video_streams_.size() > 1 && audio_streams_.size() > 1 &&\r
271                         (video_streams_.front().empty() || audio_streams_.front().empty()))\r
272                 {\r
273                         if(!video_streams_.front().empty() || !audio_streams_.front().empty())\r
274                                 CASPAR_LOG(debug) << "Truncating: " << video_streams_.front().size() << L" video-frames, " << audio_streams_.front().size() << L" audio-samples.";\r
275 \r
276                         video_streams_.pop_front();\r
277                         audio_streams_.pop_front();\r
278                 }\r
279 \r
280                 if(video_streams_.front().empty() || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
281                         return;\r
282                 \r
283                 switch(display_mode_)\r
284                 {\r
285                 case display_mode::simple:                                              return simple(dest);\r
286                 case display_mode::duplicate:                                   return duplicate(dest);\r
287                 case display_mode::half:                                                return half(dest);\r
288                 case display_mode::interlace:                                   return interlace(dest);\r
289                 case display_mode::deinterlace_bob:                             return simple(dest);\r
290                 case display_mode::deinterlace_bob_reinterlace: return interlace(dest);\r
291                 case display_mode::deinterlace:                                 return simple(dest);\r
292                 default:                                                                                BOOST_THROW_EXCEPTION(invalid_operation());\r
293                 }\r
294         }\r
295 \r
296         void simple(std::deque<safe_ptr<basic_frame>>& dest)\r
297         {\r
298                 if(video_streams_.front().empty() || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
299                         return;\r
300                 \r
301                 auto frame1 = pop_video();\r
302                 frame1->commit();\r
303                 frame1->audio_data() = pop_audio();\r
304 \r
305                 dest.push_back(frame1);         \r
306         }\r
307 \r
308         void duplicate(std::deque<safe_ptr<basic_frame>>& dest)\r
309         {               \r
310                 if(video_streams_.front().empty() || audio_streams_.front().size()/2 < format_desc_.audio_samples_per_frame)\r
311                         return;\r
312 \r
313                 auto frame = pop_video();\r
314                 frame->commit();\r
315 \r
316                 auto frame1 = make_safe<core::write_frame>(*frame); // make a copy\r
317                 frame1->audio_data() = pop_audio();\r
318 \r
319                 auto frame2 = frame;\r
320                 frame2->audio_data() = pop_audio();\r
321 \r
322                 dest.push_back(frame1);\r
323                 dest.push_back(frame2);\r
324         }\r
325 \r
326         void half(std::deque<safe_ptr<basic_frame>>& dest)\r
327         {       \r
328                 if(video_streams_.front().size() < 2 || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
329                         return;\r
330                                                 \r
331                 auto frame1 = pop_video();\r
332                 frame1->commit();\r
333                 frame1->audio_data() = pop_audio();\r
334                                 \r
335                 video_streams_.front().pop(); // Throw away\r
336 \r
337                 dest.push_back(frame1);\r
338         }\r
339         \r
340         void interlace(std::deque<safe_ptr<basic_frame>>& dest)\r
341         {               \r
342                 if(video_streams_.front().size() < 2 || audio_streams_.front().size() < format_desc_.audio_samples_per_frame)\r
343                         return;\r
344                 \r
345                 auto frame1 = pop_video();\r
346                 frame1->commit();\r
347 \r
348                 frame1->audio_data() = pop_audio();\r
349                                 \r
350                 auto frame2 = pop_video();\r
351 \r
352                 dest.push_back(core::basic_frame::interlace(frame1, frame2, format_desc_.mode));                \r
353         }\r
354 };\r
355 \r
356 frame_muxer::frame_muxer(double in_fps, const video_format_desc& format_desc, const safe_ptr<core::frame_factory>& frame_factory)\r
357         : impl_(new implementation(in_fps, format_desc, frame_factory)){}\r
358 void frame_muxer::push(const std::shared_ptr<AVFrame>& video_frame){impl_->push(video_frame);}\r
359 void frame_muxer::push(const std::shared_ptr<std::vector<int16_t>>& audio_samples){return impl_->push(audio_samples);}\r
360 safe_ptr<basic_frame> frame_muxer::pop(){return impl_->pop();}\r
361 size_t frame_muxer::size() const {return impl_->size();}\r
362 bool frame_muxer::empty() const {return impl_->size() == 0;}\r
363 bool frame_muxer::video_ready() const{return impl_->video_ready();}\r
364 bool frame_muxer::audio_ready() const{return impl_->audio_ready();}\r
365 \r
366 }