]> git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/video/video_decoder.cpp
702a4690aa046fc84bcb4e02396d14948d09fd05
[casparcg] / modules / ffmpeg / producer / video / video_decoder.cpp
1 /*\r
2 * copyright (c) 2010 Sveriges Television AB <info@casparcg.com>\r
3 *\r
4 *  This file is part of CasparCG.\r
5 *\r
6 *    CasparCG is free software: you can redistribute it and/or modify\r
7 *    it under the terms of the GNU General Public License as published by\r
8 *    the Free Software Foundation, either version 3 of the License, or\r
9 *    (at your option) any later version.\r
10 *\r
11 *    CasparCG is distributed in the hope that it will be useful,\r
12 *    but WITHOUT ANY WARRANTY; without even the implied warranty of\r
13 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the\r
14 *    GNU General Public License for more details.\r
15 \r
16 *    You should have received a copy of the GNU General Public License\r
17 *    along with CasparCG.  If not, see <http://www.gnu.org/licenses/>.\r
18 *\r
19 */\r
20 #include "../../stdafx.h"\r
21 \r
22 #include "video_decoder.h"\r
23 #include "pix_fmt.h"\r
24 \r
25 #include "../../ffmpeg_error.h"\r
26 #include "../filter/filter.h"\r
27 \r
28 #include <common/memory/memcpy.h>\r
29 \r
30 #include <core/video_format.h>\r
31 #include <core/producer/frame/basic_frame.h>\r
32 #include <core/mixer/write_frame.h>\r
33 #include <core/producer/frame/image_transform.h>\r
34 #include <core/producer/frame/pixel_format.h>\r
35 #include <core/producer/frame/frame_factory.h>\r
36 \r
37 #include <tbb/parallel_for.h>\r
38 \r
39 #include <boost/range/algorithm_ext.hpp>\r
40 \r
41 #if defined(_MSC_VER)\r
42 #pragma warning (push)\r
43 #pragma warning (disable : 4244)\r
44 #endif\r
45 extern "C" \r
46 {\r
47         #define __STDC_CONSTANT_MACROS\r
48         #define __STDC_LIMIT_MACROS\r
49         #include <libswscale/swscale.h>\r
50         #include <libavformat/avformat.h>\r
51         #include <libavcodec/avcodec.h>\r
52 }\r
53 #if defined(_MSC_VER)\r
54 #pragma warning (pop)\r
55 #endif\r
56 \r
57 namespace caspar {\r
58         \r
59 struct video_decoder::implementation : boost::noncopyable\r
60 {\r
61         input& input_;\r
62         std::shared_ptr<SwsContext>                                     sws_context_;\r
63         const std::shared_ptr<core::frame_factory>      frame_factory_;\r
64         AVCodecContext&                                                         codec_context_;\r
65         size_t                                                                          frame_number_;\r
66 \r
67         std::shared_ptr<filter>                                         filter_;\r
68         size_t                                                                          filter_delay_;\r
69         size_t                                                                          filter_skip_;\r
70 \r
71         std::shared_ptr<AVFrame>                                        last_frame_;\r
72         std::shared_ptr<AVFrame>                                        decoded_frame_;\r
73         std::string                                                                     filter_str_;\r
74 \r
75 public:\r
76         explicit implementation(input& input, const safe_ptr<core::frame_factory>& frame_factory, const std::string& filter_str) \r
77                 : input_(input)\r
78                 , frame_factory_(frame_factory)\r
79                 , codec_context_(*input_.get_video_codec_context())\r
80                 , frame_number_(0)\r
81                 , filter_(filter_str.empty() ? nullptr : new filter(filter_str))\r
82                 , filter_delay_(0)\r
83                 , filter_skip_(0)\r
84                 , last_frame_(avcodec_alloc_frame(), av_free)\r
85                 , filter_str_(filter_str)\r
86         {\r
87         }\r
88 \r
89         std::deque<std::pair<int, safe_ptr<core::write_frame>>> receive()\r
90         {\r
91                 std::deque<std::pair<int, safe_ptr<core::write_frame>>> result;\r
92                 \r
93                 std::shared_ptr<AVPacket> pkt;\r
94                 for(int n = 0; n < 32 && result.empty() && input_.try_pop_video_packet(pkt); ++n)       \r
95                         boost::range::push_back(result, decode(pkt));\r
96 \r
97                 return result;\r
98         }\r
99 \r
100         std::deque<std::pair<int, safe_ptr<core::write_frame>>> decode(const std::shared_ptr<AVPacket>& video_packet)\r
101         {                       \r
102                 std::deque<std::pair<int, safe_ptr<core::write_frame>>> result;\r
103                 \r
104                 if(!video_packet) // eof\r
105                         return flush();\r
106 \r
107                 if(filter_)\r
108                 {\r
109                         if(decoded_frame_)\r
110                                 push_filter_frames(make_safe(decoded_frame_));  \r
111                         \r
112                         std::shared_ptr<AVFrame> frame;\r
113 \r
114                         tbb::parallel_invoke(\r
115                         [&]\r
116                         {\r
117                                 frame = decode_frame(video_packet);\r
118                         },\r
119                         [&]\r
120                         {\r
121                                 if(decoded_frame_)\r
122                                         result = poll_filter_frames();\r
123                         });             \r
124 \r
125                         decoded_frame_ = frame;\r
126                         if(frame)\r
127                                 last_frame_ = frame;                    \r
128                 }\r
129                 else\r
130                 {\r
131                         auto frame = decode_frame(video_packet);\r
132                         \r
133                         if(frame)\r
134                                 result.push_back(std::make_pair(frame_number_++, make_write_frame(make_safe(frame))));\r
135                 }\r
136 \r
137                 return result;\r
138         }\r
139 \r
140         std::deque<std::pair<int, safe_ptr<core::write_frame>>> flush()\r
141         {\r
142                 std::deque<std::pair<int, safe_ptr<core::write_frame>>> result;\r
143 \r
144                 if(filter_)\r
145                 {\r
146                         // Get all buffered frames\r
147                         if(decoded_frame_)\r
148                         {       \r
149                                 push_filter_frames(make_safe(decoded_frame_));  \r
150                                 boost::range::push_back(result, poll_filter_frames());\r
151                         }\r
152 \r
153                         for(size_t n = 0; n < filter_delay_; ++n)\r
154                         {                                       \r
155                                 push_filter_frames(make_safe(last_frame_));     \r
156                                 boost::range::push_back(result, poll_filter_frames());\r
157                         }\r
158 \r
159                         // FIXME: Unnecessary reinitialization\r
160                         filter_skip_ = filter_delay_;\r
161                         decoded_frame_ = nullptr;\r
162                 }\r
163 \r
164                 frame_number_ = 0;\r
165                 avcodec_flush_buffers(&codec_context_);\r
166 \r
167                 return result;\r
168         }\r
169 \r
170         void push_filter_frames(const safe_ptr<AVFrame>& frame)\r
171         {               \r
172                 filter_->push(frame);           \r
173         }\r
174 \r
175         std::deque<std::pair<int, safe_ptr<core::write_frame>>> poll_filter_frames()\r
176         {\r
177                 std::deque<std::pair<int, safe_ptr<core::write_frame>>> result;\r
178                                 \r
179                 if(filter_skip_ > 0)\r
180                 {\r
181                         --filter_skip_;\r
182                         filter_->skip();\r
183                         return result;\r
184                 }\r
185 \r
186                 auto frames = filter_->poll(); \r
187 \r
188                 boost::range::transform(frames, std::back_inserter(result), [&](const safe_ptr<AVFrame>& frame)\r
189                 {\r
190                         return std::make_pair(frame_number_, make_write_frame(frame));\r
191                 });\r
192                 \r
193                 if(!frames.empty())\r
194                         ++frame_number_;\r
195                 else            \r
196                         ++filter_delay_;                \r
197 \r
198                 return result;\r
199         }\r
200         \r
201         std::shared_ptr<AVFrame> decode_frame(const std::shared_ptr<AVPacket>& video_packet)\r
202         {\r
203                 std::shared_ptr<AVFrame> decoded_frame(avcodec_alloc_frame(), av_free);\r
204 \r
205                 int frame_finished = 0;\r
206                 const int errn = avcodec_decode_video2(&codec_context_, decoded_frame.get(), &frame_finished, video_packet.get());\r
207                 \r
208                 if(errn < 0)\r
209                 {\r
210                         BOOST_THROW_EXCEPTION(\r
211                                 invalid_operation() <<\r
212                                 msg_info(av_error_str(errn)) <<\r
213                                 boost::errinfo_api_function("avcodec_decode_video") <<\r
214                                 boost::errinfo_errno(AVUNERROR(errn)));\r
215                 }\r
216 \r
217                 if(frame_finished == 0)         \r
218                         decoded_frame = nullptr;\r
219 \r
220                 return decoded_frame;\r
221         }\r
222 \r
223         safe_ptr<core::write_frame> make_write_frame(safe_ptr<AVFrame> decoded_frame)\r
224         {                       \r
225                 // We don't know what the filter output might give until we received the first frame. Initialize everything on first frame.\r
226                 auto width   = decoded_frame->width;\r
227                 auto height  = decoded_frame->height;\r
228                 auto pix_fmt = static_cast<PixelFormat>(decoded_frame->format);\r
229                 auto desc        = get_pixel_format_desc(pix_fmt, width, height);\r
230                         \r
231                 if(desc.pix_fmt == core::pixel_format::invalid)\r
232                 {\r
233                         CASPAR_VERIFY(!sws_context_); // Initialize only once. Nothing should change while running;\r
234                         CASPAR_LOG(warning) << "Hardware accelerated color transform not supported.";\r
235 \r
236                         desc = get_pixel_format_desc(PIX_FMT_BGRA, width, height);\r
237                         double param;\r
238                         sws_context_.reset(sws_getContext(width, height, pix_fmt, width, height, PIX_FMT_BGRA, SWS_BILINEAR, nullptr, nullptr, &param), sws_freeContext);\r
239                         if(!sws_context_)\r
240                                 BOOST_THROW_EXCEPTION(operation_failed() <<\r
241                                                                           msg_info("Could not create software scaling context.") << \r
242                                                                           boost::errinfo_api_function("sws_getContext"));\r
243                 }\r
244 \r
245                 auto write = frame_factory_->create_frame(this, desc);\r
246                 write->set_is_interlaced(decoded_frame->interlaced_frame != 0);\r
247 \r
248                 if(sws_context_ == nullptr)\r
249                 {\r
250                         tbb::parallel_for(0, static_cast<int>(desc.planes.size()), 1, [&](int n)\r
251                         {\r
252                                 auto plane            = desc.planes[n];\r
253                                 auto result           = write->image_data(n).begin();\r
254                                 auto decoded          = decoded_frame->data[n];\r
255                                 auto decoded_linesize = decoded_frame->linesize[n];\r
256                                 \r
257                                 // Copy line by line since ffmpeg sometimes pads each line.\r
258                                 tbb::parallel_for(tbb::blocked_range<size_t>(0, static_cast<int>(desc.planes[n].height)), [&](const tbb::blocked_range<size_t>& r)\r
259                                 {\r
260                                         for(size_t y = r.begin(); y != r.end(); ++y)\r
261                                                 memcpy(result + y*plane.linesize, decoded + y*decoded_linesize, plane.linesize);\r
262                                 });\r
263 \r
264                                 write->commit(n);\r
265                         });\r
266                 }\r
267                 else\r
268                 {\r
269                         // Use sws_scale when provided colorspace has no hw-accel.\r
270                         safe_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);     \r
271                         avcodec_get_frame_defaults(av_frame.get());                     \r
272                         avpicture_fill(reinterpret_cast<AVPicture*>(av_frame.get()), write->image_data().begin(), PIX_FMT_BGRA, width, height);\r
273                  \r
274                         sws_scale(sws_context_.get(), decoded_frame->data, decoded_frame->linesize, 0, height, av_frame->data, av_frame->linesize);     \r
275 \r
276                         write->commit();\r
277                 }       \r
278 \r
279                 // Fix field-order if needed. DVVIDEO is in lower field. Make it upper field if needed.\r
280                 if(decoded_frame->interlaced_frame)\r
281                 {\r
282                         switch(frame_factory_->get_video_format_desc().mode)\r
283                         {\r
284                         case core::video_mode::upper:\r
285                                 if(!decoded_frame->top_field_first)\r
286                                         write->get_image_transform().set_fill_translation(0.0f, 0.5/static_cast<double>(height));\r
287                                 break;\r
288                         case core::video_mode::lower:\r
289                                 if(decoded_frame->top_field_first)\r
290                                         write->get_image_transform().set_fill_translation(0.0f, -0.5/static_cast<double>(height));\r
291                                 break;\r
292                         }\r
293                 }\r
294 \r
295                 return write;\r
296         }\r
297 };\r
298 \r
299 video_decoder::video_decoder(input& input, const safe_ptr<core::frame_factory>& frame_factory, const std::string& filter_str) : impl_(new implementation(input, frame_factory, filter_str)){}\r
300 std::deque<std::pair<int, safe_ptr<core::write_frame>>> video_decoder::receive(){return impl_->receive();}\r
301 \r
302 }