git.sesse.net Git - casparcg/blob - modules/ffmpeg/producer/util/util.cpp
2.0.2: MAJOR CHANGES => needs testing
[casparcg] / modules / ffmpeg / producer / util / util.cpp
1 #include "../../stdafx.h"\r
2 \r
3 #include "util.h"\r
4 \r
5 #include "flv.h"\r
6 \r
7 #include "../../ffmpeg_error.h"\r
8 \r
9 #include <tbb/concurrent_unordered_map.h>\r
10 #include <tbb/concurrent_queue.h>\r
11 \r
12 #include <core/producer/frame/frame_transform.h>\r
13 #include <core/producer/frame/frame_factory.h>\r
14 #include <core/producer/frame_producer.h>\r
15 #include <core/mixer/write_frame.h>\r
16 \r
17 #include <common/exception/exceptions.h>\r
18 #include <common/utility/assert.h>\r
19 #include <common/memory/memcpy.h>\r
20 \r
21 #include <tbb/parallel_for.h>\r
22 \r
23 #include <boost/filesystem.hpp>\r
24 #include <boost/lexical_cast.hpp>\r
25 \r
26 #if defined(_MSC_VER)\r
27 #pragma warning (push)\r
28 #pragma warning (disable : 4244)\r
29 #endif\r
30 extern "C" \r
31 {\r
32         #include <libswscale/swscale.h>\r
33         #include <libavcodec/avcodec.h>\r
34         #include <libavformat/avformat.h>\r
35 }\r
36 #if defined(_MSC_VER)\r
37 #pragma warning (pop)\r
38 #endif\r
39 \r
40 namespace caspar { namespace ffmpeg {\r
41                 \r
42 safe_ptr<AVPacket> flush_packet()\r
43 {\r
44         static auto packet = create_packet();\r
45         return packet;\r
46 }\r
47 \r
48 std::shared_ptr<core::audio_buffer> flush_audio()\r
49 {\r
50         static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());\r
51         return audio;\r
52 }\r
53 \r
54 std::shared_ptr<core::audio_buffer> empty_audio()\r
55 {\r
56         static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());\r
57         return audio;\r
58 }\r
59 \r
60 std::shared_ptr<AVFrame>                        flush_video()\r
61 {\r
62         static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);\r
63         return video;\r
64 }\r
65 \r
66 std::shared_ptr<AVFrame>                        empty_video()\r
67 {\r
68         static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);\r
69         return video;\r
70 }\r
71 \r
72 core::field_mode::type get_mode(const AVFrame& frame)\r
73 {\r
74         if(!frame.interlaced_frame)\r
75                 return core::field_mode::progressive;\r
76 \r
77         return frame.top_field_first ? core::field_mode::upper : core::field_mode::lower;\r
78 }\r
79 \r
80 core::pixel_format::type get_pixel_format(PixelFormat pix_fmt)\r
81 {\r
82         switch(pix_fmt)\r
83         {\r
84         case CASPAR_PIX_FMT_LUMA:       return core::pixel_format::luma;\r
85         case PIX_FMT_GRAY8:                     return core::pixel_format::gray;\r
86         case PIX_FMT_BGRA:                      return core::pixel_format::bgra;\r
87         case PIX_FMT_ARGB:                      return core::pixel_format::argb;\r
88         case PIX_FMT_RGBA:                      return core::pixel_format::rgba;\r
89         case PIX_FMT_ABGR:                      return core::pixel_format::abgr;\r
90         case PIX_FMT_YUV444P:           return core::pixel_format::ycbcr;\r
91         case PIX_FMT_YUV422P:           return core::pixel_format::ycbcr;\r
92         case PIX_FMT_YUV420P:           return core::pixel_format::ycbcr;\r
93         case PIX_FMT_YUV411P:           return core::pixel_format::ycbcr;\r
94         case PIX_FMT_YUV410P:           return core::pixel_format::ycbcr;\r
95         case PIX_FMT_YUVA420P:          return core::pixel_format::ycbcra;\r
96         default:                                        return core::pixel_format::invalid;\r
97         }\r
98 }\r
99 \r
100 core::pixel_format_desc get_pixel_format_desc(PixelFormat pix_fmt, size_t width, size_t height)\r
101 {\r
102         // Get linesizes\r
103         AVPicture dummy_pict;   \r
104         avpicture_fill(&dummy_pict, nullptr, pix_fmt == CASPAR_PIX_FMT_LUMA ? PIX_FMT_GRAY8 : pix_fmt, width, height);\r
105 \r
106         core::pixel_format_desc desc;\r
107         desc.pix_fmt = get_pixel_format(pix_fmt);\r
108                 \r
109         switch(desc.pix_fmt)\r
110         {\r
111         case core::pixel_format::gray:\r
112         case core::pixel_format::luma:\r
113                 {\r
114                         desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));                                               \r
115                         return desc;\r
116                 }\r
117         case core::pixel_format::bgra:\r
118         case core::pixel_format::argb:\r
119         case core::pixel_format::rgba:\r
120         case core::pixel_format::abgr:\r
121                 {\r
122                         desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0]/4, height, 4));                                             \r
123                         return desc;\r
124                 }\r
125         case core::pixel_format::ycbcr:\r
126         case core::pixel_format::ycbcra:\r
127                 {               \r
128                         // Find chroma height\r
129                         size_t size2 = dummy_pict.data[2] - dummy_pict.data[1];\r
130                         size_t h2 = size2/dummy_pict.linesize[1];                       \r
131 \r
132                         desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));\r
133                         desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[1], h2, 1));\r
134                         desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[2], h2, 1));\r
135 \r
136                         if(desc.pix_fmt == core::pixel_format::ycbcra)                                          \r
137                                 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[3], height, 1));       \r
138                         return desc;\r
139                 }               \r
140         default:                \r
141                 desc.pix_fmt = core::pixel_format::invalid;\r
142                 return desc;\r
143         }\r
144 }\r
145 \r
146 int make_alpha_format(int format)\r
147 {\r
148         switch(get_pixel_format(static_cast<PixelFormat>(format)))\r
149         {\r
150         case core::pixel_format::ycbcr:\r
151         case core::pixel_format::ycbcra:\r
152                 return CASPAR_PIX_FMT_LUMA;\r
153         default:\r
154                 return format;\r
155         }\r
156 }\r
157 \r
158 safe_ptr<core::write_frame> make_write_frame(const void* tag, const safe_ptr<AVFrame>& decoded_frame, const safe_ptr<core::frame_factory>& frame_factory, int hints)\r
159 {                       \r
160         static tbb::concurrent_unordered_map<size_t, tbb::concurrent_queue<std::shared_ptr<SwsContext>>> sws_contexts_;\r
161         \r
162         if(decoded_frame->width < 1 || decoded_frame->height < 1)\r
163                 return make_safe<core::write_frame>(tag);\r
164 \r
165         const auto width  = decoded_frame->width;\r
166         const auto height = decoded_frame->height;\r
167         auto desc                 = get_pixel_format_desc(static_cast<PixelFormat>(decoded_frame->format), width, height);\r
168         \r
169         if(hints & core::frame_producer::ALPHA_HINT)\r
170                 desc = get_pixel_format_desc(static_cast<PixelFormat>(make_alpha_format(decoded_frame->format)), width, height);\r
171 \r
172         std::shared_ptr<core::write_frame> write;\r
173 \r
174         if(desc.pix_fmt == core::pixel_format::invalid)\r
175         {\r
176                 auto pix_fmt = static_cast<PixelFormat>(decoded_frame->format);\r
177 \r
178                 write = frame_factory->create_frame(tag, get_pixel_format_desc(PIX_FMT_BGRA, width, height));\r
179                 write->set_type(get_mode(*decoded_frame));\r
180 \r
181                 std::shared_ptr<SwsContext> sws_context;\r
182 \r
183                 //CASPAR_LOG(warning) << "Hardware accelerated color transform not supported.";\r
184 \r
185                 size_t key = width << 20 | height << 8 | pix_fmt;\r
186                         \r
187                 auto& pool = sws_contexts_[key];\r
188                                                 \r
189                 if(!pool.try_pop(sws_context))\r
190                 {\r
191                         double param;\r
192                         sws_context.reset(sws_getContext(width, height, pix_fmt, width, height, PIX_FMT_BGRA, SWS_BILINEAR, nullptr, nullptr, &param), sws_freeContext);\r
193                 }\r
194                         \r
195                 if(!sws_context)\r
196                 {\r
197                         BOOST_THROW_EXCEPTION(operation_failed() << msg_info("Could not create software scaling context.") << \r
198                                                                         boost::errinfo_api_function("sws_getContext"));\r
199                 }       \r
200 \r
201                 // Use sws_scale when provided colorspace has no hw-accel.\r
202                 safe_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);     \r
203                 avcodec_get_frame_defaults(av_frame.get());                     \r
204                 avpicture_fill(reinterpret_cast<AVPicture*>(av_frame.get()), write->image_data().begin(), PIX_FMT_BGRA, width, height);\r
205                  \r
206                 sws_scale(sws_context.get(), decoded_frame->data, decoded_frame->linesize, 0, height, av_frame->data, av_frame->linesize);      \r
207                 pool.push(sws_context);\r
208 \r
209                 write->commit();\r
210         }\r
211         else\r
212         {\r
213                 write = frame_factory->create_frame(tag, desc);\r
214                 write->set_type(get_mode(*decoded_frame));\r
215 \r
216                 for(int n = 0; n < static_cast<int>(desc.planes.size()); ++n)\r
217                 {\r
218                         auto plane            = desc.planes[n];\r
219                         auto result           = write->image_data(n).begin();\r
220                         auto decoded          = decoded_frame->data[n];\r
221                         auto decoded_linesize = decoded_frame->linesize[n];\r
222                         \r
223                         CASPAR_ASSERT(decoded);\r
224                         CASPAR_ASSERT(write->image_data(n).begin());\r
225 \r
226                         if(decoded_linesize != static_cast<int>(plane.width))\r
227                         {\r
228                                 // Copy line by line since ffmpeg sometimes pads each line.\r
229                                 tbb::parallel_for<size_t>(0, desc.planes[n].height, [&](size_t y)\r
230                                 {\r
231                                         fast_memcpy(result + y*plane.linesize, decoded + y*decoded_linesize, plane.linesize);\r
232                                 });\r
233                         }\r
234                         else\r
235                         {\r
236                                 fast_memcpy(result, decoded, plane.size);\r
237                         }\r
238 \r
239                         write->commit(n);\r
240                 }\r
241         }\r
242         \r
243         // Fix field-order if needed\r
244         if(write->get_type() == core::field_mode::lower && frame_factory->get_video_format_desc().field_mode == core::field_mode::upper)\r
245                 write->get_frame_transform().fill_translation[1] += 1.0/static_cast<double>(frame_factory->get_video_format_desc().height);\r
246         else if(write->get_type() == core::field_mode::upper && frame_factory->get_video_format_desc().field_mode == core::field_mode::lower)\r
247                 write->get_frame_transform().fill_translation[1] -= 1.0/static_cast<double>(frame_factory->get_video_format_desc().height);\r
248 \r
249         return make_safe_ptr(write);\r
250 }\r
251 \r
252 bool is_sane_fps(AVRational time_base)\r
253 {\r
254         double fps = static_cast<double>(time_base.den) / static_cast<double>(time_base.num);\r
255         return fps > 20.0 && fps < 65.0;\r
256 }\r
257 \r
258 void fix_meta_data(AVFormatContext& context)\r
259 {\r
260         auto video_index = av_find_best_stream(&context, AVMEDIA_TYPE_VIDEO, -1, -1, 0, 0);\r
261         auto audio_index = av_find_best_stream(&context, AVMEDIA_TYPE_AUDIO, -1, -1, 0, 0);\r
262 \r
263         if(video_index < 0)\r
264                 return;\r
265 \r
266         auto& video_context = *context.streams[video_index]->codec;\r
267         auto& video_stream  = *context.streams[video_index];\r
268                                                 \r
269         if(boost::filesystem2::path(context.filename).extension() == ".flv")\r
270         {\r
271                 try\r
272                 {\r
273                         auto meta = read_flv_meta_info(context.filename);\r
274                         double fps = boost::lexical_cast<double>(meta["framerate"]);\r
275                         video_context.time_base.num = 1000000;\r
276                         video_context.time_base.den = static_cast<int>(fps*1000000.0);\r
277                         video_stream.nb_frames = static_cast<int64_t>(boost::lexical_cast<double>(meta["duration"])*fps);\r
278                 }\r
279                 catch(...){}\r
280         }\r
281         else\r
282         {\r
283                 if(video_stream.nb_frames == 0)\r
284                         video_stream.nb_frames = video_stream.duration;\r
285 \r
286                 if(!is_sane_fps(video_context.time_base))\r
287                 {                       \r
288                         if(video_context.time_base.num == 1)\r
289                                 video_context.time_base.num = static_cast<int>(std::pow(10.0, static_cast<int>(std::log10(static_cast<float>(video_context.time_base.den)))-1));        \r
290 \r
291                         if(!is_sane_fps(video_context.time_base) && audio_index > -1)\r
292                         {\r
293                                 auto& audio_context = *context.streams[audio_index]->codec;\r
294                                 auto& audio_stream  = *context.streams[audio_index];\r
295 \r
296                                 double duration_sec = audio_stream.duration / static_cast<double>(audio_context.sample_rate);\r
297                                                                 \r
298                                 video_context.time_base.num = static_cast<int>(duration_sec*100000.0);\r
299                                 video_context.time_base.den = static_cast<int>(video_stream.nb_frames*100000);\r
300                         }\r
301                 }\r
302 \r
303                 if(audio_index > -1) // Check for invalid double frame-rate\r
304                 {\r
305                         auto& audio_context             = *context.streams[audio_index]->codec;\r
306                         auto& audio_stream              = *context.streams[audio_index];\r
307 \r
308                         double duration_sec             = audio_stream.duration / static_cast<double>(audio_context.sample_rate);\r
309                         double fps                              = static_cast<double>(video_context.time_base.den) / static_cast<double>(video_context.time_base.num);\r
310 \r
311                         double fps_nb_frames    = static_cast<double>(duration_sec*fps);\r
312                         double stream_nb_frames = static_cast<double>(video_stream.nb_frames);\r
313                         double diff                             = std::abs(fps_nb_frames - stream_nb_frames*2.0);\r
314                         if(diff < fps_nb_frames*0.05)\r
315                                 video_context.time_base.num *= 2;\r
316                 }\r
317                 else\r
318                 {\r
319                         video_context.time_base.den = video_stream.r_frame_rate.num;\r
320                         video_context.time_base.num = video_stream.r_frame_rate.den;\r
321                 }\r
322         }\r
323 \r
324         double fps = static_cast<double>(video_context.time_base.den) / static_cast<double>(video_context.time_base.num);\r
325 \r
326         double closest_fps = 0.0;\r
327         for(int n = 0; n < core::video_format::count; ++n)\r
328         {\r
329                 auto format = core::video_format_desc::get(static_cast<core::video_format::type>(n));\r
330 \r
331                 double diff1 = std::abs(format.fps - fps);\r
332                 double diff2 = std::abs(closest_fps - fps);\r
333 \r
334                 if(diff1 < diff2)\r
335                         closest_fps = format.fps;\r
336         }\r
337         \r
338         video_context.time_base.num = 1000000;\r
339         video_context.time_base.den = static_cast<int>(closest_fps*1000000.0);\r
340 }\r
341 \r
342 safe_ptr<AVPacket> create_packet()\r
343 {\r
344         safe_ptr<AVPacket> packet(new AVPacket, [](AVPacket* p)\r
345         {\r
346                 av_free_packet(p);\r
347                 delete p;\r
348         });\r
349         \r
350         av_init_packet(packet.get());\r
351         return packet;\r
352 }\r
353 \r
354 safe_ptr<AVCodecContext> open_codec(AVFormatContext& context, enum AVMediaType type, int& index)\r
355 {       \r
356         AVCodec* decoder;\r
357         index = THROW_ON_ERROR2(av_find_best_stream(&context, type, -1, -1, &decoder, 0), "");\r
358         THROW_ON_ERROR2(avcodec_open(context.streams[index]->codec, decoder), "");\r
359         return safe_ptr<AVCodecContext>(context.streams[index]->codec, avcodec_close);\r
360 }\r
361 \r
362 safe_ptr<AVFormatContext> open_input(const std::wstring& filename)\r
363 {\r
364         AVFormatContext* weak_context = nullptr;\r
365         THROW_ON_ERROR2(avformat_open_input(&weak_context, narrow(filename).c_str(), nullptr, nullptr), filename);\r
366         safe_ptr<AVFormatContext> context(weak_context, av_close_input_file);                   \r
367         THROW_ON_ERROR2(avformat_find_stream_info(weak_context, nullptr), filename);\r
368         fix_meta_data(*context);\r
369         return context;\r
370 }\r
371 //\r
372 //void av_dup_frame(AVFrame* frame)\r
373 //{\r
374 //      AVFrame* new_frame = avcodec_alloc_frame();\r
375 //\r
376 //\r
377 //      const uint8_t *src_data[4] = {0};\r
378 //      memcpy(const_cast<uint8_t**>(&src_data[0]), frame->data, 4);\r
379 //      const int src_linesizes[4] = {0};\r
380 //      memcpy(const_cast<int*>(&src_linesizes[0]), frame->linesize, 4);\r
381 //\r
382 //      av_image_alloc(new_frame->data, new_frame->linesize, new_frame->width, new_frame->height, frame->format, 16);\r
383 //\r
384 //      av_image_copy(new_frame->data, new_frame->linesize, src_data, src_linesizes, frame->format, new_frame->width, new_frame->height);\r
385 //\r
386 //      frame =\r
387 //}\r
388 \r
389 }}