/*
* Copyright (c) 2011 Sveriges Television AB <info@casparcg.com>
*
* This file is part of CasparCG (www.casparcg.com).
*
* CasparCG is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* CasparCG is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with CasparCG. If not, see <http://www.gnu.org/licenses/>.
*
* Author: Robert Nagy, ronag89@gmail.com
*/
\r
22 #include "../../stdafx.h"
\r
28 #include "../tbb_avcodec.h"
\r
29 #include "../../ffmpeg_error.h"
\r
31 #include <tbb/concurrent_unordered_map.h>
\r
32 #include <tbb/concurrent_queue.h>
\r
34 #include <core/frame/frame_transform.h>
\r
35 #include <core/frame/frame_factory.h>
\r
36 #include <core/producer/frame_producer.h>
\r
37 #include <core/frame/write_frame.h>
\r
39 #include <common/except.h>
\r
41 #include <tbb/parallel_for.h>
\r
43 #include <common/assert.h>
\r
44 #include <boost/filesystem.hpp>
\r
45 #include <boost/lexical_cast.hpp>
\r
49 #if defined(_MSC_VER)
\r
50 #pragma warning (push)
\r
51 #pragma warning (disable : 4244)
\r
55 #include <libswscale/swscale.h>
\r
56 #include <libavcodec/avcodec.h>
\r
57 #include <libavformat/avformat.h>
\r
59 #if defined(_MSC_VER)
\r
60 #pragma warning (pop)
\r
63 namespace caspar { namespace ffmpeg {
\r
65 std::shared_ptr<core::audio_buffer> flush_audio()
\r
67 static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());
\r
71 std::shared_ptr<core::audio_buffer> empty_audio()
\r
73 static std::shared_ptr<core::audio_buffer> audio(new core::audio_buffer());
\r
77 std::shared_ptr<AVFrame> flush_video()
\r
79 static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);
\r
83 std::shared_ptr<AVFrame> empty_video()
\r
85 static std::shared_ptr<AVFrame> video(avcodec_alloc_frame(), av_free);
\r
89 core::field_mode get_mode(const AVFrame& frame)
\r
91 if(!frame.interlaced_frame)
\r
92 return core::field_mode::progressive;
\r
94 return frame.top_field_first ? core::field_mode::upper : core::field_mode::lower;
\r
97 core::pixel_format get_pixel_format(PixelFormat pix_fmt)
\r
101 case CASPAR_PIX_FMT_LUMA: return core::pixel_format::luma;
\r
102 case PIX_FMT_GRAY8: return core::pixel_format::gray;
\r
103 case PIX_FMT_BGRA: return core::pixel_format::bgra;
\r
104 case PIX_FMT_ARGB: return core::pixel_format::argb;
\r
105 case PIX_FMT_RGBA: return core::pixel_format::rgba;
\r
106 case PIX_FMT_ABGR: return core::pixel_format::abgr;
\r
107 case PIX_FMT_YUV444P: return core::pixel_format::ycbcr;
\r
108 case PIX_FMT_YUV422P: return core::pixel_format::ycbcr;
\r
109 case PIX_FMT_YUV420P: return core::pixel_format::ycbcr;
\r
110 case PIX_FMT_YUV411P: return core::pixel_format::ycbcr;
\r
111 case PIX_FMT_YUV410P: return core::pixel_format::ycbcr;
\r
112 case PIX_FMT_YUVA420P: return core::pixel_format::ycbcra;
\r
113 default: return core::pixel_format::invalid;
\r
// Builds a core::pixel_format_desc for an ffmpeg pixel format and frame size: the format comes
// from get_pixel_format() and one plane entry is appended per image plane.
// NOTE(review): this excerpt is missing the lines between the visible ones (delimiters and any
// return/default statements), so the exact exit from each case group must be confirmed
// against the original file.
117 core::pixel_format_desc pixel_format_desc(PixelFormat pix_fmt, int width, int height)
\r
120 AVPicture dummy_pict;
\r
// avpicture_fill is given a null buffer, so dummy_pict is used below only for its linesize[]
// values and the distance between its data[] pointers. CASPAR_PIX_FMT_LUMA is laid out as PIX_FMT_GRAY8.
121 avpicture_fill(&dummy_pict, nullptr, pix_fmt == CASPAR_PIX_FMT_LUMA ? PIX_FMT_GRAY8 : pix_fmt, width, height);
\r
123 core::pixel_format_desc desc = get_pixel_format(pix_fmt);
\r
125 switch(desc.format.value())
\r
127 case core::pixel_format::gray:
\r
128 case core::pixel_format::luma:
\r
// Single plane; the arguments are presumably (width, height, channels) — confirm against core::pixel_format_desc::plane.
130 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));
\r
133 case core::pixel_format::bgra:
\r
134 case core::pixel_format::argb:
\r
135 case core::pixel_format::rgba:
\r
136 case core::pixel_format::abgr:
\r
// Single packed plane: the byte linesize is divided by 4 and the last argument is 4.
138 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0]/4, height, 4));
\r
141 case core::pixel_format::ycbcr:
\r
142 case core::pixel_format::ycbcra:
\r
144 // Find chroma height
\r
// size2 is the byte distance from the start of plane 1 to the start of plane 2; dividing it
// by plane 1's linesize gives the number of rows in a chroma plane.
145 int size2 = static_cast<int>(dummy_pict.data[2] - dummy_pict.data[1]);
\r
146 int h2 = size2/dummy_pict.linesize[1];
\r
148 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));
\r
149 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[1], h2, 1));
\r
150 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[2], h2, 1));
\r
// The alpha variant gets a fourth plane with the full frame height.
152 if(desc.format == core::pixel_format::ycbcra)
\r
153 desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[3], height, 1));
\r
// Presumably the default branch: the description is marked invalid — confirm against the original file.
157 desc.format = core::pixel_format::invalid;
\r
// Chooses the pixel format to use when only the alpha/key signal of a frame is wanted.
// `format` is cast to PixelFormat and classified with get_pixel_format().
// NOTE(review): the value returned for formats other than ycbcr/ycbcra is not visible in this
// excerpt — confirm against the original file.
162 int make_alpha_format(int format)
\r
164 switch(get_pixel_format(static_cast<PixelFormat>(format)).value())
\r
166 case core::pixel_format::ycbcr:
\r
167 case core::pixel_format::ycbcra:
\r
// Both planar YUV classes are replaced by CASPAR_PIX_FMT_LUMA.
168 return CASPAR_PIX_FMT_LUMA;
\r
// Produces a core::write_frame from a decoded AVFrame, using frame_factory to allocate it.
// Two paths are visible: when the decoded format has no valid pixel_format_desc the picture is
// converted with libswscale into a supported layout; otherwise the planes are copied row by row.
// Afterwards the frame transform is adjusted for 480-line input and for field-order mismatch.
// NOTE(review): this excerpt is missing the lines between the visible ones (braces, `else`
// lines and a few short statements); the branch structure described here is inferred from
// the visible statements and must be confirmed against the original file.
174 spl::shared_ptr<core::write_frame> make_write_frame(const void* tag, const spl::shared_ptr<AVFrame>& decoded_frame, double fps, const spl::shared_ptr<core::frame_factory>& frame_factory, int flags)
\r
// Function-local static map from an int key to a queue of SwsContext pointers, used below as a pool.
176 static tbb::concurrent_unordered_map<int, tbb::concurrent_queue<std::shared_ptr<SwsContext>>> sws_contexts_;
\r
// Frames without a positive size yield a frame created with an invalid pixel format description.
178 if(decoded_frame->width < 1 || decoded_frame->height < 1)
\r
179 return frame_factory->create_frame(tag, core::pixel_format_desc(core::pixel_format::invalid));
\r
181 const auto width = decoded_frame->width;
\r
182 const auto height = decoded_frame->height;
\r
183 auto desc = pixel_format_desc(static_cast<PixelFormat>(decoded_frame->format), width, height);
\r
// With the alpha_only flag the description is rebuilt from make_alpha_format() instead.
185 if(flags & core::frame_producer::flags::alpha_only)
\r
186 desc = pixel_format_desc(static_cast<PixelFormat>(make_alpha_format(decoded_frame->format)), width, height);
\r
188 std::shared_ptr<core::write_frame> write;
\r
// Conversion path: the decoded format is not one pixel_format_desc() can describe.
190 if(desc.format == core::pixel_format::invalid)
\r
192 auto pix_fmt = static_cast<PixelFormat>(decoded_frame->format);
\r
// BGRA is the default conversion target; the packed and 10-bit YUV formats listed below are
// converted to the 8-bit planar format named on the following line instead.
193 auto target_pix_fmt = PIX_FMT_BGRA;
\r
195 if(pix_fmt == PIX_FMT_UYVY422)
\r
196 target_pix_fmt = PIX_FMT_YUV422P;
\r
197 else if(pix_fmt == PIX_FMT_YUYV422)
\r
198 target_pix_fmt = PIX_FMT_YUV422P;
\r
199 else if(pix_fmt == PIX_FMT_UYYVYY411)
\r
200 target_pix_fmt = PIX_FMT_YUV411P;
\r
201 else if(pix_fmt == PIX_FMT_YUV420P10)
\r
202 target_pix_fmt = PIX_FMT_YUV420P;
\r
203 else if(pix_fmt == PIX_FMT_YUV422P10)
\r
204 target_pix_fmt = PIX_FMT_YUV422P;
\r
205 else if(pix_fmt == PIX_FMT_YUV444P10)
\r
206 target_pix_fmt = PIX_FMT_YUV444P;
\r
208 auto target_desc = pixel_format_desc(target_pix_fmt, width, height);
\r
210 write = frame_factory->create_frame(tag, target_desc, fps, get_mode(*decoded_frame));
\r
212 std::shared_ptr<SwsContext> sws_context;
\r
214 //CASPAR_LOG(warning) << "Hardware accelerated color transform not supported.";
\r
// Pool key packed into one int from width, height, source format and target format.
// NOTE(review): the packing is lossy. The masks keep only the low 10 bits of width
// (so 1920 and 896 give the same field), bits 8..15 of height (so 1080 and 1088 give the
// same field) and bits 1..7 of pix_fmt (the lowest bit is dropped). Distinct conversions can
// therefore share a key, in which case a pooled context built for a different size or source
// format would be popped and reused — confirm and consider a key that keeps every field intact.
216 int key = ((width << 22) & 0xFFC00000) | ((height << 6) & 0x003FC000) | ((pix_fmt << 7) & 0x00007F00) | ((target_pix_fmt << 0) & 0x0000007F);
\r
218 auto& pool = sws_contexts_[key];
\r
// Reuse a pooled context when one is available, otherwise create one (same size in and out, bilinear).
220 if(!pool.try_pop(sws_context))
\r
// NOTE(review): "¶m" looks like a mis-decoded "&param" (HTML entity "&para;") in this copy of
// the file, and the declaration of that variable is not visible here — restore from the original file.
223 sws_context.reset(sws_getContext(width, height, pix_fmt, width, height, target_pix_fmt, SWS_BILINEAR, nullptr, nullptr, ¶m), sws_freeContext);
\r
// Raised as operation_failed; the guarding condition is not visible in this excerpt.
228 BOOST_THROW_EXCEPTION(operation_failed() << msg_info("Could not create software scaling context.") <<
\r
229 boost::errinfo_api_function("sws_getContext"));
\r
// Destination AVFrame whose data pointers refer directly to the write frame's image buffers.
232 spl::shared_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);
\r
233 avcodec_get_frame_defaults(av_frame.get());
\r
234 if(target_pix_fmt == PIX_FMT_BGRA)
\r
// BGRA: let avpicture_fill set up the single plane and verify its size equals the write buffer's size.
236 auto size = avpicture_fill(reinterpret_cast<AVPicture*>(av_frame.get()), write->image_data(0).begin(), PIX_FMT_BGRA, width, height);
\r
237 CASPAR_VERIFY(size == write->image_data(0).size());
\r
// Planar targets: point each AVFrame plane at the matching write-frame plane.
241 av_frame->width = width;
\r
242 av_frame->height = height;
\r
243 for(int n = 0; n < target_desc.planes.size(); ++n)
\r
245 av_frame->data[n] = write->image_data(n).begin();
\r
246 av_frame->linesize[n] = target_desc.planes[n].linesize;
\r
// Convert all rows, then hand the context back to the pool for later calls.
250 sws_scale(sws_context.get(), decoded_frame->data, decoded_frame->linesize, 0, height, av_frame->data, av_frame->linesize);
\r
251 pool.push(sws_context);
\r
// Copy path: the decoded layout is used as-is.
255 write = frame_factory->create_frame(tag, desc, fps, get_mode(*decoded_frame));
\r
257 for(int n = 0; n < static_cast<int>(desc.planes.size()); ++n)
\r
259 auto plane = desc.planes[n];
\r
260 auto result = write->image_data(n).begin();
\r
261 auto decoded = decoded_frame->data[n];
\r
262 auto decoded_linesize = decoded_frame->linesize[n];
\r
264 CASPAR_ASSERT(decoded);
\r
265 CASPAR_ASSERT(write->image_data(n).begin());
\r
267 // Copy line by line since ffmpeg sometimes pads each line.
\r
268 tbb::affinity_partitioner ap;
\r
// Rows of the plane are split across TBB tasks; each row copies plane.linesize bytes from a
// source row that advances by the decoder's own linesize.
269 tbb::parallel_for(tbb::blocked_range<int>(0, desc.planes[n].height), [&](const tbb::blocked_range<int>& r)
\r
271 for(int y = r.begin(); y != r.end(); ++y)
\r
272 A_memcpy(result + y*plane.linesize, decoded + y*decoded_linesize, plane.linesize);
\r
// 480-line input: shift the fill down by 2 output lines and scale it to (1 - 6/height) of the
// output height, where height is the channel format's height.
277 if(decoded_frame->height == 480) // NTSC DV
\r
279 write->frame_transform().image_transform.fill_translation[1] += 2.0/static_cast<double>(frame_factory->video_format_desc().height);
\r
280 write->frame_transform().image_transform.fill_scale[1] = 1.0 - 6.0*1.0/static_cast<double>(frame_factory->video_format_desc().height);
\r
283 // Fix field-order if needed
\r
// A lower-first frame on an upper-first channel is moved down one output line; the opposite case is moved up one line.
284 if(get_mode(*decoded_frame) == core::field_mode::lower && frame_factory->video_format_desc().field_mode == core::field_mode::upper)
\r
285 write->frame_transform().image_transform.fill_translation[1] += 1.0/static_cast<double>(frame_factory->video_format_desc().height);
\r
286 else if(get_mode(*decoded_frame) == core::field_mode::upper && frame_factory->video_format_desc().field_mode == core::field_mode::lower)
\r
287 write->frame_transform().image_transform.fill_translation[1] -= 1.0/static_cast<double>(frame_factory->video_format_desc().height);
\r
289 return spl::make_shared_ptr(write);
\r
292 spl::shared_ptr<AVFrame> make_av_frame(caspar::core::data_frame& frame)
\r
294 std::array<void*, 4> data = {};
\r
295 for(int n = 0; n < frame.pixel_format_desc().planes.size(); ++n)
\r
296 data[n] = frame.image_data(n).begin();
\r
298 return make_av_frame(data, frame.pixel_format_desc());
\r
// Builds an AVFrame that refers to caller-supplied plane pointers: width/height come from
// plane 0, data[]/linesize[] are filled per plane, and the ffmpeg format is chosen from pix_desc.format.
// Only the pointers are stored; no pixel data is copied in the visible code.
// NOTE(review): this excerpt is missing the lines between the visible ones (the switch head,
// braces, any `break` statements and the final return) — confirm against the original file.
301 spl::shared_ptr<AVFrame> make_av_frame(std::array<void*, 4> data, const core::pixel_format_desc& pix_desc)
\r
303 spl::shared_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);
\r
304 avcodec_get_frame_defaults(av_frame.get());
\r
306 auto planes = pix_desc.planes;
\r
307 auto format = pix_desc.format.value();
\r
// planes[0] is read unconditionally — assumes pix_desc has at least one plane; TODO confirm.
309 av_frame->width = planes[0].width;
\r
310 av_frame->height = planes[0].height;
\r
// `data` holds 4 entries — assumes planes.size() <= 4; TODO confirm.
311 for(int n = 0; n < planes.size(); ++n)
\r
313 av_frame->data[n] = reinterpret_cast<uint8_t*>(data[n]);
\r
314 av_frame->linesize[n] = planes[n].linesize;
\r
318 case core::pixel_format::rgba:
\r
319 av_frame->format = PIX_FMT_RGBA;
\r
321 case core::pixel_format::argb:
\r
322 av_frame->format = PIX_FMT_ARGB;
\r
324 case core::pixel_format::bgra:
\r
325 av_frame->format = PIX_FMT_BGRA;
\r
327 case core::pixel_format::abgr:
\r
328 av_frame->format = PIX_FMT_ABGR;
\r
330 case core::pixel_format::gray:
\r
331 av_frame->format = PIX_FMT_GRAY8;
\r
// Planar YUV: the subsampling is deduced by comparing plane 1 (c_*) with plane 0 (y_*).
333 case core::pixel_format::ycbcr:
\r
335 int y_w = planes[0].width;
\r
336 int y_h = planes[0].height;
\r
337 int c_w = planes[1].width;
\r
338 int c_h = planes[1].height;
\r
// Same size -> 4:4:4; half width -> 4:2:2; quarter width -> 4:1:1;
// half width and half height -> 4:2:0; quarter width and half height -> 4:1:0.
340 if(c_h == y_h && c_w == y_w)
\r
341 av_frame->format = PIX_FMT_YUV444P;
\r
342 else if(c_h == y_h && c_w*2 == y_w)
\r
343 av_frame->format = PIX_FMT_YUV422P;
\r
344 else if(c_h == y_h && c_w*4 == y_w)
\r
345 av_frame->format = PIX_FMT_YUV411P;
\r
346 else if(c_h*2 == y_h && c_w*2 == y_w)
\r
347 av_frame->format = PIX_FMT_YUV420P;
\r
348 else if(c_h*2 == y_h && c_w*4 == y_w)
\r
349 av_frame->format = PIX_FMT_YUV410P;
\r
// The alpha variant is always reported as YUVA420P; plane dimensions are not inspected here.
353 case core::pixel_format::ycbcra:
\r
354 av_frame->format = PIX_FMT_YUVA420P;
\r
360 bool is_sane_fps(AVRational time_base)
\r
362 double fps = static_cast<double>(time_base.den) / static_cast<double>(time_base.num);
\r
363 return fps > 20.0 && fps < 65.0;
\r
// Tries to turn an implausible time base into one whose den/num ratio passes is_sane_fps().
// NOTE(review): the lines between the visible ones (how `tmp` is modified, what is assigned
// back and what is returned) are missing from this excerpt — confirm against the original file.
366 AVRational fix_time_base(AVRational time_base)
\r
// A numerator of exactly 1 is replaced by 10^(d-1), where d is log10(den) truncated to an
// integer; for example den = 25000 gives num = 1000.
// NOTE(review): for den < 10 the exponent is -1, std::pow gives 0.1 and the int cast makes num 0 — confirm this is intended.
368 if(time_base.num == 1)
\r
369 time_base.num = static_cast<int>(std::pow(10.0, static_cast<int>(std::log10(static_cast<float>(time_base.den)))-1));
\r
// Still implausible: work on a copy and test the copy again.
371 if(!is_sane_fps(time_base))
\r
373 auto tmp = time_base;
\r
375 if(is_sane_fps(tmp))
\r
// Estimates the frame rate of the best video stream in `context` and returns the fps of the
// core::video_format whose rate is nearest to that estimate; returns fail_value when no video stream is found.
// NOTE(review): this excerpt is missing the lines between the visible ones (braces, the
// comparison that selects the closest format and whatever surrounds the FLV lookup) —
// confirm against the original file.
382 double read_fps(AVFormatContext& context, double fail_value)
\r
384 auto video_index = av_find_best_stream(&context, AVMEDIA_TYPE_VIDEO, -1, -1, 0, 0);
\r
385 auto audio_index = av_find_best_stream(&context, AVMEDIA_TYPE_AUDIO, -1, -1, 0, 0);
\r
387 if(video_index > -1)
\r
389 const auto video_context = context.streams[video_index]->codec;
\r
390 const auto video_stream = context.streams[video_index];
\r
392 AVRational time_base = video_context->time_base;
\r
// .flv files: the rate is read from the file's "framerate" metadata entry and returned directly.
// boost::lexical_cast throws bad_lexical_cast if the entry is not a number; how that is handled is not visible here.
394 if(boost::filesystem::path(context.filename).extension().string() == ".flv")
\r
398 auto meta = read_flv_meta_info(context.filename);
\r
399 return boost::lexical_cast<double>(meta["framerate"]);
\r
// Other files: scale the codec time base by ticks_per_frame, then repair it if it looks implausible.
408 time_base.num *= video_context->ticks_per_frame;
\r
410 if(!is_sane_fps(time_base))
\r
412 time_base = fix_time_base(time_base);
\r
// Last resort when an audio stream exists: derive the rate as video frame count divided by the
// audio duration in seconds, both scaled by 100000 to fit the integer rational.
// Assumes audio_stream.duration is counted in samples — TODO confirm.
414 if(!is_sane_fps(time_base) && audio_index > -1)
\r
416 auto& audio_context = *context.streams[audio_index]->codec;
\r
417 auto& audio_stream = *context.streams[audio_index];
\r
419 double duration_sec = audio_stream.duration / static_cast<double>(audio_context.sample_rate);
\r
421 time_base.num = static_cast<int>(duration_sec*100000.0);
\r
422 time_base.den = static_cast<int>(video_stream->nb_frames*100000);
\r
427 double fps = static_cast<double>(time_base.den) / static_cast<double>(time_base.num);
\r
// Walk every known video format and track the one whose fps is nearest to the estimate.
429 double closest_fps = 0.0;
\r
430 for(int n = 0; n < core::video_format::count; ++n)
\r
432 auto format = core::video_format_desc(core::video_format(n));
\r
434 double diff1 = std::abs(format.fps - fps);
\r
435 double diff2 = std::abs(closest_fps - fps);
\r
438 closest_fps = format.fps;
\r
441 return closest_fps;
\r
// No video stream was found.
444 return fail_value;
\r
// Fills in the frame count (nb_frames) of the best video stream in `context`.
// NOTE(review): this excerpt is missing the lines between the visible ones (braces and
// whatever surrounds the FLV lookup) — confirm against the original file.
447 void fix_meta_data(AVFormatContext& context)
\r
449 auto video_index = av_find_best_stream(&context, AVMEDIA_TYPE_VIDEO, -1, -1, 0, 0);
\r
451 if(video_index > -1)
\r
453 auto video_stream = context.streams[video_index];
\r
454 auto video_context = context.streams[video_index]->codec;
\r
// .flv files: frame count = "duration" metadata entry multiplied by the "framerate" entry.
// boost::lexical_cast throws bad_lexical_cast if either entry is not a number; how that is handled is not visible here.
456 if(boost::filesystem::path(context.filename).extension().string() == ".flv")
\r
460 auto meta = read_flv_meta_info(context.filename);
\r
461 double fps = boost::lexical_cast<double>(meta["framerate"]);
\r
462 video_stream->nb_frames = static_cast<int64_t>(boost::lexical_cast<double>(meta["duration"])*fps);
\r
468 auto stream_time = video_stream->time_base;
\r
469 auto duration = video_stream->duration;
\r
470 auto codec_time = video_context->time_base;
\r
471 auto ticks = video_context->ticks_per_frame;
\r
// Only when the container reports no frame count: convert the stream duration (in stream
// time-base units) to frames using the codec time base and ticks per frame.
// NOTE(review): this is an integer division. A zero codec_time.num, stream_time.den or ticks
// makes the divisor zero, and the divisor's factors look like plain ints that could overflow
// before the division — confirm the field types and whether a guard is needed.
473 if(video_stream->nb_frames == 0)
\r
474 video_stream->nb_frames = (duration*stream_time.num*codec_time.den)/(stream_time.den*codec_time.num*ticks);
\r
// Allocates an AVPacket with `new`, hands it to an spl::shared_ptr with a custom deleter
// lambda, and initialises it with av_init_packet.
// NOTE(review): the deleter's body and the return statement are missing from this excerpt —
// confirm against the original file.
479 spl::shared_ptr<AVPacket> create_packet()
\r
481 spl::shared_ptr<AVPacket> packet(new AVPacket, [](AVPacket* p)
\r
487 av_init_packet(packet.get());
\r
491 spl::shared_ptr<AVCodecContext> open_codec(AVFormatContext& context, enum AVMediaType type, int& index)
\r
494 index = THROW_ON_ERROR2(av_find_best_stream(&context, type, -1, -1, &decoder, 0), "");
\r
495 //if(strcmp(decoder->name, "prores") == 0 && decoder->next && strcmp(decoder->next->name, "prores_lgpl") == 0)
\r
496 // decoder = decoder->next;
\r
498 THROW_ON_ERROR2(tbb_avcodec_open(context.streams[index]->codec, decoder), "");
\r
499 return spl::shared_ptr<AVCodecContext>(context.streams[index]->codec, tbb_avcodec_close);
\r
502 spl::shared_ptr<AVFormatContext> open_input(const std::wstring& filename)
\r
504 AVFormatContext* weak_context = nullptr;
\r
505 THROW_ON_ERROR2(avformat_open_input(&weak_context, u8(filename).c_str(), nullptr, nullptr), filename);
\r
506 spl::shared_ptr<AVFormatContext> context(weak_context, av_close_input_file);
\r
507 THROW_ON_ERROR2(avformat_find_stream_info(weak_context, nullptr), filename);
\r
508 fix_meta_data(*context);
\r
/// Formats a video mode as "<width>x<height><p|i><rate>", e.g. "1920x1080i50.00".
/// @param width       Frame width in pixels.
/// @param height      Frame height in pixels.
/// @param fps         Frame rate; for interlaced modes the printed rate is 2 * fps.
/// @param interlaced  Selects the "i" marker and the doubled rate; otherwise "p".
/// @return The formatted mode string, with the rate printed to two decimals.
std::wstring print_mode(int width, int height, double fps, bool interlaced)
{
	std::wostringstream fps_ss;
	fps_ss << std::fixed << std::setprecision(2) << (!interlaced ? fps : 2.0 * fps);

	// The casts pick one std::to_wstring overload explicitly.
	return std::to_wstring(static_cast<long long>(width)) + L"x" + std::to_wstring(static_cast<long long>(height)) + (!interlaced ? L"p" : L"i") + fps_ss.str();
}
\r
// Decides whether ffmpeg recognises a file: up to 2048 bytes are read from it and passed to
// av_probe_input_format2; the result is true when a format is returned.
// NOTE(review): this excerpt is missing the lines between the visible ones (the statement after
// the .m2t check, any empty-buffer handling and the declarations of `pb` and `score`) —
// confirm against the original file.
520 bool is_valid_file(const std::wstring filename)
\r
// .m2t files are special-cased; the outcome of this branch is not visible here.
522 if(boost::filesystem::path(filename).extension() == ".m2t")
\r
// NOTE(review): the stream is opened without std::ios::binary, so on platforms that translate
// line endings the probed bytes may differ from the file's bytes — confirm.
525 std::ifstream file(filename);
\r
527 std::vector<unsigned char> buf;
\r
528 for(auto file_it = std::istreambuf_iterator<char>(file); file_it != std::istreambuf_iterator<char>() && buf.size() < 2048; ++file_it)
\r
529 buf.push_back(*file_it);
\r
// NOTE(review): if u8() returns a std::string by value, c_str() points into a temporary that is
// destroyed at the end of this statement, leaving pb.filename dangling when the probe runs —
// confirm, and keep the converted string in a named local if so.
535 pb.filename = u8(filename).c_str();
\r
// NOTE(review): ffmpeg documents that the probe buffer must be followed by AVPROBE_PADDING_SIZE
// zero bytes; no such padding is visible here — confirm.
536 pb.buf = buf.data();
\r
537 pb.buf_size = static_cast<int>(buf.size());
\r
540 return av_probe_input_format2(&pb, true, &score) != nullptr;
\r
// Looks in the parent directory of `stem` for a file with that name and any extension.
// Returns the path of the first directory entry whose stem equals stem's filename
// (case-insensitive, boost::iequals) and for which is_valid_file() is true.
// NOTE(review): the value returned when no entry matches is missing from this excerpt —
// confirm against the original file.
543 std::wstring probe_stem(const std::wstring stem)
\r
545 auto stem2 = boost::filesystem::path(stem);
\r
546 auto dir = stem2.parent_path();
\r
// directory_iterator throws if `dir` cannot be opened; that is not handled in the visible code.
547 for(auto it = boost::filesystem::directory_iterator(dir); it != boost::filesystem::directory_iterator(); ++it)
\r
549 if(boost::iequals(it->path().stem().wstring(), stem2.filename().wstring()) && is_valid_file(it->path().wstring()))
\r
550 return it->path().wstring();
\r
555 //void av_dup_frame(AVFrame* frame)
\r
557 // AVFrame* new_frame = avcodec_alloc_frame();
\r
560 // const uint8_t *src_data[4] = {0};
\r
561 // memcpy(const_cast<uint8_t**>(&src_data[0]), frame->data, 4);
\r
562 // const int src_linesizes[4] = {0};
\r
563 // memcpy(const_cast<int*>(&src_linesizes[0]), frame->linesize, 4);
\r
565 // av_image_alloc(new_frame->data, new_frame->linesize, new_frame->width, new_frame->height, frame->format, 16);
\r
567 // av_image_copy(new_frame->data, new_frame->linesize, src_data, src_linesizes, frame->format, new_frame->width, new_frame->height);
\r