/*
* Copyright (c) 2011 Sveriges Television AB <info@casparcg.com>
*
* This file is part of CasparCG (www.casparcg.com).
*
* CasparCG is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* CasparCG is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with CasparCG. If not, see <http://www.gnu.org/licenses/>.
*
* Author: Robert Nagy, ronag89@gmail.com
*/

#include "../../stdafx.h"

#include "util.h"

#include "flv.h"

#include "../tbb_avcodec.h"
#include "../../ffmpeg_error.h"

#include <tbb/concurrent_unordered_map.h>
#include <tbb/concurrent_queue.h>

#include <core/producer/frame/frame_transform.h>
#include <core/producer/frame/frame_factory.h>
#include <core/producer/frame_producer.h>
#include <core/mixer/device_frame.h>

#include <common/exception/exceptions.h>

#include <tbb/parallel_for.h>

#include <common/assert.h>
#include <boost/filesystem.hpp>
#include <boost/lexical_cast.hpp>

#include <asmlib.h>

#if defined(_MSC_VER)
#pragma warning (push)
#pragma warning (disable : 4244)
#endif
extern "C"
{
    #include <libswscale/swscale.h>
    #include <libavcodec/avcodec.h>
    #include <libavformat/avformat.h>
}
#if defined(_MSC_VER)
#pragma warning (pop)
#endif

namespace caspar { namespace ffmpeg {

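// Shared sentinel buffers: each of these helpers returns the same static
// instance every call, so downstream code can presumably recognize the
// flush/empty markers by pointer identity.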
std::shared_ptr<core::audio_buffer> flush_audio()
{
    static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());
    return audio;
}

std::shared_ptr<core::audio_buffer> empty_audio()
{
    static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());
    return audio;
}

std::shared_ptr<AVFrame> flush_video()
{
    static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);
    return video;
}

std::shared_ptr<AVFrame> empty_video()
{
    static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);
    return video;
}

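// Maps an AVFrame's interlacing flags to the corresponding core field mode.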
core::field_mode get_mode(const AVFrame& frame)
{
    if(!frame.interlaced_frame)
        return core::field_mode::progressive;

    return frame.top_field_first ? core::field_mode::upper : core::field_mode::lower;
}

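// Translates an ffmpeg PixelFormat into the subset of formats the mixer
// understands; anything else maps to pixel_format::invalid and is converted
// with swscale in make_device_frame below.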
core::pixel_format get_pixel_format(PixelFormat pix_fmt)
{
    switch(pix_fmt)
    {
    case CASPAR_PIX_FMT_LUMA:   return core::pixel_format::luma;
    case PIX_FMT_GRAY8:         return core::pixel_format::gray;
    case PIX_FMT_BGRA:          return core::pixel_format::bgra;
    case PIX_FMT_ARGB:          return core::pixel_format::argb;
    case PIX_FMT_RGBA:          return core::pixel_format::rgba;
    case PIX_FMT_ABGR:          return core::pixel_format::abgr;
    case PIX_FMT_YUV444P:       return core::pixel_format::ycbcr;
    case PIX_FMT_YUV422P:       return core::pixel_format::ycbcr;
    case PIX_FMT_YUV420P:       return core::pixel_format::ycbcr;
    case PIX_FMT_YUV411P:       return core::pixel_format::ycbcr;
    case PIX_FMT_YUV410P:       return core::pixel_format::ycbcr;
    case PIX_FMT_YUVA420P:      return core::pixel_format::ycbcra;
    default:                    return core::pixel_format::invalid;
    }
}

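// Builds a pixel_format_desc for the given format and resolution. avpicture_fill
// with a null buffer is used only to obtain the per-plane linesizes; the chroma
// plane height is then derived from the distance between the plane pointers.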
core::pixel_format_desc get_pixel_format_desc(PixelFormat pix_fmt, int width, int height)
{
    // Get linesizes
    AVPicture dummy_pict;
    avpicture_fill(&dummy_pict, nullptr, pix_fmt == CASPAR_PIX_FMT_LUMA ? PIX_FMT_GRAY8 : pix_fmt, width, height);

    core::pixel_format_desc desc;
    desc.pix_fmt = get_pixel_format(pix_fmt);

    switch(desc.pix_fmt.value())
    {
    case core::pixel_format::gray:
    case core::pixel_format::luma:
        {
            desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));
            return desc;
        }
    case core::pixel_format::bgra:
    case core::pixel_format::argb:
    case core::pixel_format::rgba:
    case core::pixel_format::abgr:
        {
            desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0]/4, height, 4));
            return desc;
        }
    case core::pixel_format::ycbcr:
    case core::pixel_format::ycbcra:
        {
            // Find chroma height
            int size2 = static_cast<int>(dummy_pict.data[2] - dummy_pict.data[1]);
            int h2 = size2/dummy_pict.linesize[1];

            desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));
            desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[1], h2, 1));
            desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[2], h2, 1));

            if(desc.pix_fmt == core::pixel_format::ycbcra)
                desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[3], height, 1));
            return desc;
        }
    default:
        desc.pix_fmt = core::pixel_format::invalid;
        return desc;
    }
}

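// Returns the pixel format to use when only the alpha/key channel is requested:
// planar YCbCr formats are reinterpreted as a single luma plane
// (CASPAR_PIX_FMT_LUMA); other formats are passed through unchanged.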
int make_alpha_format(int format)
{
    switch(get_pixel_format(static_cast<PixelFormat>(format)).value())
    {
    case core::pixel_format::ycbcr:
    case core::pixel_format::ycbcra:
        return CASPAR_PIX_FMT_LUMA;
    default:
        return format;
    }
}

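// Uploads a decoded AVFrame into a device (GPU) frame. Natively supported
// formats are copied plane by plane; unsupported formats are first converted
// with swscale, using a pool of contexts keyed on resolution and source/target
// format so concurrent producers do not recreate them for every frame.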
safe_ptr<core::device_frame> make_device_frame(const void* tag, const safe_ptr<AVFrame>& decoded_frame, const safe_ptr<core::frame_factory>& frame_factory, int flags)
{
    static tbb::concurrent_unordered_map<int, tbb::concurrent_queue<std::shared_ptr<SwsContext>>> sws_contexts_;

    if(decoded_frame->width < 1 || decoded_frame->height < 1)
        return make_safe<core::device_frame>(tag);

    const auto width  = decoded_frame->width;
    const auto height = decoded_frame->height;
    auto desc         = get_pixel_format_desc(static_cast<PixelFormat>(decoded_frame->format), width, height);

    if(flags & core::frame_producer::flags::alpha_only)
        desc = get_pixel_format_desc(static_cast<PixelFormat>(make_alpha_format(decoded_frame->format)), width, height);

    std::shared_ptr<core::device_frame> write;

    if(desc.pix_fmt == core::pixel_format::invalid)
    {
        auto pix_fmt = static_cast<PixelFormat>(decoded_frame->format);
        auto target_pix_fmt = PIX_FMT_BGRA;

        if(pix_fmt == PIX_FMT_UYVY422)
            target_pix_fmt = PIX_FMT_YUV422P;
        else if(pix_fmt == PIX_FMT_YUYV422)
            target_pix_fmt = PIX_FMT_YUV422P;
        else if(pix_fmt == PIX_FMT_UYYVYY411)
            target_pix_fmt = PIX_FMT_YUV411P;
        else if(pix_fmt == PIX_FMT_YUV420P10)
            target_pix_fmt = PIX_FMT_YUV420P;
        else if(pix_fmt == PIX_FMT_YUV422P10)
            target_pix_fmt = PIX_FMT_YUV422P;
        else if(pix_fmt == PIX_FMT_YUV444P10)
            target_pix_fmt = PIX_FMT_YUV444P;

        auto target_desc = get_pixel_format_desc(target_pix_fmt, width, height);

        write = frame_factory->create_frame(tag, target_desc, [&](const std::vector<boost::iterator_range<uint8_t*>>& dest)
        {
            std::shared_ptr<SwsContext> sws_context;

            //CASPAR_LOG(warning) << "Hardware accelerated color transform not supported.";

            int key = ((width << 22) & 0xFFC00000) | ((height << 6) & 0x003FC000) | ((pix_fmt << 7) & 0x00007F00) | ((target_pix_fmt << 0) & 0x0000007F);

            auto& pool = sws_contexts_[key];

            if(!pool.try_pop(sws_context))
            {
                double param;
                sws_context.reset(sws_getContext(width, height, pix_fmt, width, height, target_pix_fmt, SWS_BILINEAR, nullptr, nullptr, &param), sws_freeContext);
            }

            if(!sws_context)
            {
                BOOST_THROW_EXCEPTION(operation_failed() << msg_info("Could not create software scaling context.") <<
                                      boost::errinfo_api_function("sws_getContext"));
            }

            safe_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);
            avcodec_get_frame_defaults(av_frame.get());
            if(target_pix_fmt == PIX_FMT_BGRA)
            {
                avpicture_fill(reinterpret_cast<AVPicture*>(av_frame.get()), dest.at(0).begin(), PIX_FMT_BGRA, width, height);
            }
            else
            {
                av_frame->width  = width;
                av_frame->height = height;
                for(int n = 0; n < target_desc.planes.size(); ++n)
                {
                    av_frame->data[n]     = dest.at(n).begin();
                    av_frame->linesize[n] = target_desc.planes[n].linesize;
                }
            }

            sws_scale(sws_context.get(), decoded_frame->data, decoded_frame->linesize, 0, height, av_frame->data, av_frame->linesize);
            pool.push(sws_context);
        }, get_mode(*decoded_frame));
    }
    else
    {
        write = frame_factory->create_frame(tag, desc, [&](const std::vector<boost::iterator_range<uint8_t*>>& dest)
        {
            for(int n = 0; n < static_cast<int>(desc.planes.size()); ++n)
            {
                auto plane            = desc.planes[n];
                auto result           = dest.at(n).begin();
                auto decoded          = decoded_frame->data[n];
                auto decoded_linesize = decoded_frame->linesize[n];

                CASPAR_ASSERT(decoded);
                CASPAR_ASSERT(dest.at(n).begin());

                // Copy line by line since ffmpeg sometimes pads each line.
                tbb::affinity_partitioner ap;
                tbb::parallel_for(tbb::blocked_range<int>(0, desc.planes[n].height), [&](const tbb::blocked_range<int>& r)
                {
                    for(int y = r.begin(); y != r.end(); ++y)
                        A_memcpy(result + y*plane.linesize, decoded + y*decoded_linesize, plane.linesize);
                }, ap);
            }
        }, get_mode(*decoded_frame));
    }

    if(decoded_frame->height == 480) // NTSC DV
    {
        write->get_frame_transform().fill_translation[1] += 2.0/static_cast<double>(frame_factory->get_video_format_desc().height);
        write->get_frame_transform().fill_scale[1] = 1.0 - 6.0*1.0/static_cast<double>(frame_factory->get_video_format_desc().height);
    }

    // Fix field-order if needed
    if(write->get_type() == core::field_mode::lower && frame_factory->get_video_format_desc().field_mode == core::field_mode::upper)
        write->get_frame_transform().fill_translation[1] += 1.0/static_cast<double>(frame_factory->get_video_format_desc().height);
    else if(write->get_type() == core::field_mode::upper && frame_factory->get_video_format_desc().field_mode == core::field_mode::lower)
        write->get_frame_transform().fill_translation[1] -= 1.0/static_cast<double>(frame_factory->get_video_format_desc().height);

    return make_safe_ptr(write);
}

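// Heuristic used when deriving a frame rate from a time base: rates outside
// roughly 20-65 fps are treated as implausible.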
bool is_sane_fps(AVRational time_base)
{
    double fps = static_cast<double>(time_base.den) / static_cast<double>(time_base.num);
    return fps > 20.0 && fps < 65.0;
}

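// Attempts to repair degenerate codec time bases. A numerator of 1 is scaled
// up from the denominator's magnitude (e.g. 1/25000 becomes 1000/25000, i.e.
// 25 fps), and if the rate is still implausible the denominator is halved
// when that brings it back into the sane range.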
AVRational fix_time_base(AVRational time_base)
{
    if(time_base.num == 1)
        time_base.num = static_cast<int>(std::pow(10.0, static_cast<int>(std::log10(static_cast<float>(time_base.den)))-1));

    if(!is_sane_fps(time_base))
    {
        auto tmp = time_base;
        tmp.den /= 2;
        if(is_sane_fps(tmp))
            time_base = tmp;
    }

    return time_base;
}

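// Determines the frame rate of an input. FLV files are read from their
// metadata; otherwise the codec time base is used (repaired if necessary, or
// estimated from the audio duration and frame count as a last resort) and the
// result is snapped to the closest rate among the known video formats.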
double read_fps(AVFormatContext& context, double fail_value)
{
    auto video_index = av_find_best_stream(&context, AVMEDIA_TYPE_VIDEO, -1, -1, 0, 0);
    auto audio_index = av_find_best_stream(&context, AVMEDIA_TYPE_AUDIO, -1, -1, 0, 0);

    if(video_index > -1)
    {
        const auto video_context = context.streams[video_index]->codec;
        const auto video_stream  = context.streams[video_index];

        AVRational time_base = video_context->time_base;

        if(boost::filesystem::path(context.filename).extension().string() == ".flv")
        {
            try
            {
                auto meta = read_flv_meta_info(context.filename);
                return boost::lexical_cast<double>(meta["framerate"]);
            }
            catch(...)
            {
                return 0.0;
            }
        }
        else
        {
            time_base.num *= video_context->ticks_per_frame;

            if(!is_sane_fps(time_base))
            {
                time_base = fix_time_base(time_base);

                if(!is_sane_fps(time_base) && audio_index > -1)
                {
                    auto& audio_context = *context.streams[audio_index]->codec;
                    auto& audio_stream  = *context.streams[audio_index];

                    double duration_sec = audio_stream.duration / static_cast<double>(audio_context.sample_rate);

                    time_base.num = static_cast<int>(duration_sec*100000.0);
                    time_base.den = static_cast<int>(video_stream->nb_frames*100000);
                }
            }
        }

        double fps = static_cast<double>(time_base.den) / static_cast<double>(time_base.num);

        double closest_fps = 0.0;
        for(int n = 0; n < core::video_format::count; ++n)
        {
            auto format = core::video_format_desc(core::video_format(n));

            double diff1 = std::abs(format.fps - fps);
            double diff2 = std::abs(closest_fps - fps);

            if(diff1 < diff2)
                closest_fps = format.fps;
        }

        return closest_fps;
    }

    return fail_value;
}

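// Fills in a missing nb_frames on the video stream, either from the FLV
// metadata (duration * framerate) or from the stream duration and the codec
// time base.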
void fix_meta_data(AVFormatContext& context)
{
    auto video_index = av_find_best_stream(&context, AVMEDIA_TYPE_VIDEO, -1, -1, 0, 0);

    if(video_index > -1)
    {
        auto video_stream  = context.streams[video_index];
        auto video_context = context.streams[video_index]->codec;

        if(boost::filesystem::path(context.filename).extension().string() == ".flv")
        {
            try
            {
                auto meta = read_flv_meta_info(context.filename);
                double fps = boost::lexical_cast<double>(meta["framerate"]);
                video_stream->nb_frames = static_cast<int64_t>(boost::lexical_cast<double>(meta["duration"])*fps);
            }
            catch(...){}
        }
        else
        {
            auto stream_time = video_stream->time_base;
            auto duration    = video_stream->duration;
            auto codec_time  = video_context->time_base;
            auto ticks       = video_context->ticks_per_frame;

            if(video_stream->nb_frames == 0)
                video_stream->nb_frames = (duration*stream_time.num*codec_time.den)/(stream_time.den*codec_time.num*ticks);
        }
    }
}

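// Allocates an initialized AVPacket whose payload is released with
// av_free_packet when the last reference goes away.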
safe_ptr<AVPacket> create_packet()
{
    safe_ptr<AVPacket> packet(new AVPacket, [](AVPacket* p)
    {
        av_free_packet(p);
        delete p;
    });

    av_init_packet(packet.get());
    return packet;
}

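// Finds the best stream of the requested type, opens its decoder through the
// tbb-threaded wrapper and returns the codec context with a matching closer.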
safe_ptr<AVCodecContext> open_codec(AVFormatContext& context, enum AVMediaType type, int& index)
{
    AVCodec* decoder;
    index = THROW_ON_ERROR2(av_find_best_stream(&context, type, -1, -1, &decoder, 0), "");
    //if(strcmp(decoder->name, "prores") == 0 && decoder->next && strcmp(decoder->next->name, "prores_lgpl") == 0)
    //  decoder = decoder->next;

    THROW_ON_ERROR2(tbb_avcodec_open(context.streams[index]->codec, decoder), "");
    return safe_ptr<AVCodecContext>(context.streams[index]->codec, tbb_avcodec_close);
}

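// Opens an input file, reads its stream info and patches up missing metadata
// before handing the format context to the caller.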
safe_ptr<AVFormatContext> open_input(const std::wstring& filename)
{
    AVFormatContext* weak_context = nullptr;
    THROW_ON_ERROR2(avformat_open_input(&weak_context, u8(filename).c_str(), nullptr, nullptr), filename);
    safe_ptr<AVFormatContext> context(weak_context, av_close_input_file);
    THROW_ON_ERROR2(avformat_find_stream_info(weak_context, nullptr), filename);
    fix_meta_data(*context);
    return context;
}

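// Formats a video mode for logging, doubling the rate for interlaced material,
// e.g. print_mode(1920, 1080, 25.0, true) yields L"1920x1080i50.00".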
std::wstring print_mode(int width, int height, double fps, bool interlaced)
{
    std::wostringstream fps_ss;
    fps_ss << std::fixed << std::setprecision(2) << (!interlaced ? fps : 2.0 * fps);

    return boost::lexical_cast<std::wstring>(width) + L"x" + boost::lexical_cast<std::wstring>(height) + (!interlaced ? L"p" : L"i") + fps_ss.str();
}

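// Checks whether a file looks like something ffmpeg can open by probing its
// first 2 KB; .m2t files are accepted without probing.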
bool is_valid_file(const std::wstring filename)
{
    if(boost::filesystem::path(filename).extension() == ".m2t")
        return true;

    std::ifstream file(filename);

    std::vector<unsigned char> buf;
    for(auto file_it = std::istreambuf_iterator<char>(file); file_it != std::istreambuf_iterator<char>() && buf.size() < 2048; ++file_it)
        buf.push_back(*file_it);

    if(buf.empty())
        return false;

    // Keep the utf-8 copy of the filename alive while ffmpeg probes it.
    auto u8_filename = u8(filename);

    AVProbeData pb;
    pb.filename = u8_filename.c_str();
    pb.buf      = buf.data();
    pb.buf_size = static_cast<int>(buf.size());

    int score = 0;
    return av_probe_input_format2(&pb, true, &score) != nullptr;
}

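// Given a path (typically without extension), searches its directory for a
// file whose stem matches case-insensitively and passes is_valid_file, and
// returns that file's full path, or an empty string if none is found.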
std::wstring probe_stem(const std::wstring stem)
{
    auto stem2 = boost::filesystem::path(stem);
    auto dir = stem2.parent_path();
    for(auto it = boost::filesystem::directory_iterator(dir); it != boost::filesystem::directory_iterator(); ++it)
    {
        if(boost::iequals(it->path().stem().wstring(), stem2.filename().wstring()) && is_valid_file(it->path().wstring()))
            return it->path().wstring();
    }
    return L"";
}
//
//void av_dup_frame(AVFrame* frame)
//{
//    AVFrame* new_frame = avcodec_alloc_frame();
//
//
//    const uint8_t *src_data[4] = {0};
//    memcpy(const_cast<uint8_t**>(&src_data[0]), frame->data, 4);
//    const int src_linesizes[4] = {0};
//    memcpy(const_cast<int*>(&src_linesizes[0]), frame->linesize, 4);
//
//    av_image_alloc(new_frame->data, new_frame->linesize, new_frame->width, new_frame->height, frame->format, 16);
//
//    av_image_copy(new_frame->data, new_frame->linesize, src_data, src_linesizes, frame->format, new_frame->width, new_frame->height);
//
//    frame =
//}

}}