]> git.sesse.net Git - casparcg/blob - modules/ffmpeg/consumer/ffmpeg_consumer.cpp
1213b7d7bd688326d053ef1c47789801bfb46504
[casparcg] / modules / ffmpeg / consumer / ffmpeg_consumer.cpp
1 /*\r
2 * Copyright (c) 2011 Sveriges Television AB <info@casparcg.com>\r
3 *\r
4 * This file is part of CasparCG (www.casparcg.com).\r
5 *\r
6 * CasparCG is free software: you can redistribute it and/or modify\r
7 * it under the terms of the GNU General Public License as published by\r
8 * the Free Software Foundation, either version 3 of the License, or\r
9 * (at your option) any later version.\r
10 *\r
11 * CasparCG is distributed in the hope that it will be useful,\r
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of\r
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the\r
14 * GNU General Public License for more details.\r
15 *\r
16 * You should have received a copy of the GNU General Public License\r
17 * along with CasparCG. If not, see <http://www.gnu.org/licenses/>.\r
18 *\r
19 * Author: Robert Nagy, ronag89@gmail.com\r
20 */\r
21  \r
22 #include "../StdAfx.h"\r
23 \r
24 #include "../ffmpeg_error.h"\r
25 \r
26 #include "ffmpeg_consumer.h"\r
27 \r
28 #include "../producer/audio/audio_resampler.h"\r
29 \r
30 #include <core/mixer/read_frame.h>\r
31 #include <core/mixer/audio/audio_util.h>\r
32 #include <core/consumer/frame_consumer.h>\r
33 #include <core/video_format.h>\r
34 \r
35 #include <common/concurrency/executor.h>\r
36 #include <common/diagnostics/graph.h>\r
37 #include <common/env.h>\r
38 #include <common/utility/string.h>\r
39 #include <common/utility/param.h>\r
40 \r
41 #include <boost/algorithm/string.hpp>\r
42 #include <boost/timer.hpp>\r
43 #include <boost/property_tree/ptree.hpp>\r
44 \r
45 #include <tbb/cache_aligned_allocator.h>\r
46 #include <tbb/parallel_invoke.h>\r
47 \r
48 #include <boost/range/algorithm.hpp>\r
49 #include <boost/range/algorithm_ext.hpp>\r
50 #include <boost/lexical_cast.hpp>\r
51 \r
52 #include <string>\r
53 \r
54 #if defined(_MSC_VER)\r
55 #pragma warning (push)\r
56 #pragma warning (disable : 4244)\r
57 #endif\r
58 extern "C" \r
59 {\r
60         #define __STDC_CONSTANT_MACROS\r
61         #define __STDC_LIMIT_MACROS\r
62         #include <libavformat/avformat.h>\r
63         #include <libswscale/swscale.h>\r
64         #include <libavutil/opt.h>\r
65         #include <libavutil/pixdesc.h>\r
66         #include <libavutil/parseutils.h>\r
67 }\r
68 #if defined(_MSC_VER)\r
69 #pragma warning (pop)\r
70 #endif\r
71 \r
72 namespace caspar { namespace ffmpeg {\r
73         \r
74 int av_opt_set(void *obj, const char *name, const char *val, int search_flags)\r
75 {\r
76         AVClass* av_class = *(AVClass**)obj;\r
77 \r
78         if((strcmp(name, "pix_fmt") == 0 || strcmp(name, "pixel_format") == 0) && strcmp(av_class->class_name, "AVCodecContext") == 0)\r
79         {\r
80                 AVCodecContext* c = (AVCodecContext*)obj;               \r
81                 auto pix_fmt = av_get_pix_fmt(val);\r
82                 if(pix_fmt == PIX_FMT_NONE)\r
83                         return -1;              \r
84                 c->pix_fmt = pix_fmt;\r
85                 return 0;\r
86         }\r
87         if((strcmp(name, "r") == 0 || strcmp(name, "frame_rate") == 0) && strcmp(av_class->class_name, "AVCodecContext") == 0)\r
88         {\r
89                 AVCodecContext* c = (AVCodecContext*)obj;       \r
90 \r
91                 if(c->codec_type != AVMEDIA_TYPE_VIDEO)\r
92                         return -1;\r
93 \r
94                 AVRational rate;\r
95                 int ret = av_parse_video_rate(&rate, val);\r
96                 if(ret < 0)\r
97                         return ret;\r
98 \r
99                 c->time_base.num = rate.den;\r
100                 c->time_base.den = rate.num;\r
101                 return 0;\r
102         }\r
103 \r
104         return ::av_opt_set(obj, name, val, search_flags);\r
105 }\r
106 \r
/// One user supplied "-name value" setting for the muxer or an encoder.
struct option
{
        std::string name;
        std::string value;

        /// Both strings are taken by value and moved into the members.
        option(std::string opt_name, std::string opt_value)
                : name(std::move(opt_name))
                , value(std::move(opt_value))
        {
        }
};
118         \r
119 struct output_format\r
120 {\r
121         AVOutputFormat* format;\r
122         int                             width;\r
123         int                             height;\r
124         CodecID                 vcodec;\r
125         CodecID                 acodec;\r
126 \r
127         output_format(const core::video_format_desc& format_desc, const std::string& filename, std::vector<option>& options)\r
128                 : format(av_guess_format(nullptr, filename.c_str(), nullptr))\r
129                 , width(format_desc.width)\r
130                 , height(format_desc.height)\r
131                 , vcodec(CODEC_ID_NONE)\r
132                 , acodec(CODEC_ID_NONE)\r
133         {\r
134                 boost::range::remove_erase_if(options, [&](const option& o)\r
135                 {\r
136                         return set_opt(o.name, o.value);\r
137                 });\r
138                 \r
139                 if(vcodec == CODEC_ID_NONE)\r
140                         vcodec = format->video_codec;\r
141 \r
142                 if(acodec == CODEC_ID_NONE)\r
143                         acodec = format->audio_codec;\r
144                 \r
145                 if(vcodec == CODEC_ID_NONE)\r
146                         vcodec = CODEC_ID_H264;\r
147                 \r
148                 if(acodec == CODEC_ID_NONE)\r
149                         acodec = CODEC_ID_PCM_S16LE;\r
150         }\r
151         \r
152         bool set_opt(const std::string& name, const std::string& value)\r
153         {\r
154                 //if(name == "target")\r
155                 //{ \r
156                 //      enum { PAL, NTSC, FILM, UNKNOWN } norm = UNKNOWN;\r
157                 //      \r
158                 //      if(name.find("pal-") != std::string::npos)\r
159                 //              norm = PAL;\r
160                 //      else if(name.find("ntsc-") != std::string::npos)\r
161                 //              norm = NTSC;\r
162 \r
163                 //      if(norm == UNKNOWN)\r
164                 //              BOOST_THROW_EXCEPTION(invalid_argument() << arg_name_info("target"));\r
165                 //      \r
166                 //      if (name.find("-dv") != std::string::npos) \r
167                 //      {\r
168                 //              set_opt("f", "dv");\r
169                 //              set_opt("s", norm == PAL ? "720x576" : "720x480");\r
170                 //              //set_opt("pix_fmt", name.find("-dv50") != std::string::npos ? "yuv422p" : norm == PAL ? "yuv420p" : "yuv411p");\r
171                 //              //set_opt("ar", "48000");\r
172                 //              //set_opt("ac", "2");\r
173                 //      } \r
174                 //}\r
175                 if(name == "f")\r
176                 {\r
177                         format = av_guess_format(value.c_str(), nullptr, nullptr);\r
178 \r
179                         if(format == nullptr)\r
180                                 BOOST_THROW_EXCEPTION(invalid_argument() << arg_name_info("f"));\r
181 \r
182                         return true;\r
183                 }\r
184                 else if(name == "vcodec")\r
185                 {\r
186                         auto c = avcodec_find_encoder_by_name(value.c_str());\r
187                         if(c == nullptr)\r
188                                 BOOST_THROW_EXCEPTION(invalid_argument() << arg_name_info("vcodec"));\r
189 \r
190                         vcodec = avcodec_find_encoder_by_name(value.c_str())->id;\r
191                         return true;\r
192 \r
193                 }\r
194                 else if(name == "acodec")\r
195                 {\r
196                         auto c = avcodec_find_encoder_by_name(value.c_str());\r
197                         if(c == nullptr)\r
198                                 BOOST_THROW_EXCEPTION(invalid_argument() << arg_name_info("acodec"));\r
199 \r
200                         acodec = avcodec_find_encoder_by_name(value.c_str())->id;\r
201 \r
202                         return true;\r
203                 }\r
204                 else if(name == "s")\r
205                 {\r
206                         if(av_parse_video_size(&width, &height, value.c_str()) < 0)\r
207                                 BOOST_THROW_EXCEPTION(invalid_argument() << arg_name_info("s"));\r
208                         \r
209                         return true;\r
210                 }\r
211 \r
212                 return false;\r
213         }\r
214 };\r
215 \r
/// Byte buffer type used for the encoder input/output buffers in this file;
/// its storage is obtained through tbb::cache_aligned_allocator.
typedef std::vector<uint8_t, tbb::cache_aligned_allocator<uint8_t>>     byte_vector;
217 \r
218 struct ffmpeg_consumer : boost::noncopyable\r
219 {               \r
220         const std::string                                               filename_;\r
221                 \r
222         const std::shared_ptr<AVFormatContext>  oc_;\r
223         const core::video_format_desc                   format_desc_;\r
224         \r
225         const safe_ptr<diagnostics::graph>              graph_;\r
226 \r
227         executor                                                                encode_executor_;\r
228         \r
229         std::shared_ptr<AVStream>                               audio_st_;\r
230         std::shared_ptr<AVStream>                               video_st_;\r
231         \r
232         byte_vector                                                             audio_outbuf_;\r
233         byte_vector                                                             audio_buf_;\r
234         byte_vector                                                             video_outbuf_;\r
235         byte_vector                                                             picture_buf_;\r
236         std::shared_ptr<audio_resampler>                swr_;\r
237         std::shared_ptr<SwsContext>                             sws_;\r
238 \r
239         int64_t                                                                 in_frame_number_;\r
240         int64_t                                                                 out_frame_number_;\r
241 \r
242         output_format                                                   output_format_;\r
243         \r
244 public:\r
245         ffmpeg_consumer(const std::string& filename, const core::video_format_desc& format_desc, std::vector<option> options)\r
246                 : filename_(filename)\r
247                 , video_outbuf_(1920*1080*8)\r
248                 , audio_outbuf_(10000)\r
249                 , oc_(avformat_alloc_context(), av_free)\r
250                 , format_desc_(format_desc)\r
251                 , encode_executor_(print())\r
252                 , in_frame_number_(0)\r
253                 , out_frame_number_(0)\r
254                 , output_format_(format_desc, filename, options)\r
255         {\r
256                 // TODO: Ask stakeholders about case where file already exists.\r
257                 boost::filesystem2::remove(boost::filesystem2::wpath(env::media_folder() + widen(filename))); // Delete the file if it exists\r
258 \r
259                 graph_->set_color("frame-time", diagnostics::color(0.1f, 1.0f, 0.1f));\r
260                 graph_->set_text(print());\r
261                 diagnostics::register_graph(graph_);\r
262 \r
263                 encode_executor_.set_capacity(8);\r
264 \r
265                 oc_->oformat = output_format_.format;\r
266                                 \r
267                 THROW_ON_ERROR2(av_set_parameters(oc_.get(), nullptr), "[ffmpeg_consumer]");\r
268 \r
269                 strcpy_s(oc_->filename, filename_.c_str());\r
270                 \r
271                 //  Add the audio and video streams using the default format codecs     and initialize the codecs.\r
272                 auto options2 = options;\r
273                 video_st_ = add_video_stream(options2);\r
274                 audio_st_ = add_audio_stream(options);\r
275                                 \r
276                 dump_format(oc_.get(), 0, filename_.c_str(), 1);\r
277                  \r
278                 // Open the output ffmpeg, if needed.\r
279                 if (!(oc_->oformat->flags & AVFMT_NOFILE)) \r
280                         THROW_ON_ERROR2(avio_open(&oc_->pb, filename_.c_str(), URL_WRONLY), "[ffmpeg_consumer]");\r
281                                 \r
282                 THROW_ON_ERROR2(av_write_header(oc_.get()), "[ffmpeg_consumer]");\r
283 \r
284                 if(options.size() > 0)\r
285                 {\r
286                         BOOST_FOREACH(auto& option, options)\r
287                                 CASPAR_LOG(warning) << L"Invalid option: -" << widen(option.name) << L" " << widen(option.value);\r
288                 }\r
289 \r
290                 CASPAR_LOG(info) << print() << L" Successfully Initialized.";   \r
291         }\r
292 \r
293         ~ffmpeg_consumer()\r
294         {    \r
295                 encode_executor_.stop();\r
296                 encode_executor_.join();\r
297                 \r
298                 LOG_ON_ERROR2(av_write_trailer(oc_.get()), "[ffmpeg_consumer]");\r
299                 \r
300                 audio_st_.reset();\r
301                 video_st_.reset();\r
302                           \r
303                 if (!(oc_->oformat->flags & AVFMT_NOFILE)) \r
304                         LOG_ON_ERROR2(avio_close(oc_->pb), "[ffmpeg_consumer]"); // Close the output ffmpeg.\r
305 \r
306                 CASPAR_LOG(info) << print() << L" Successfully Uninitialized."; \r
307         }\r
308                         \r
309         std::wstring print() const\r
310         {\r
311                 return L"ffmpeg[" + widen(filename_) + L"]";\r
312         }\r
313 \r
314         std::shared_ptr<AVStream> add_video_stream(std::vector<option>& options)\r
315         { \r
316                 if(output_format_.vcodec == CODEC_ID_NONE)\r
317                         return nullptr;\r
318 \r
319                 auto st = av_new_stream(oc_.get(), 0);\r
320                 if (!st)                \r
321                         BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("Could not allocate video-stream.") << boost::errinfo_api_function("av_new_stream"));              \r
322 \r
323                 auto encoder = avcodec_find_encoder(output_format_.vcodec);\r
324                 if (!encoder)\r
325                         BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("Codec not found."));\r
326 \r
327                 auto c = st->codec;\r
328 \r
329                 avcodec_get_context_defaults3(c, encoder);\r
330                                 \r
331                 c->codec_id                     = output_format_.vcodec;\r
332                 c->codec_type           = AVMEDIA_TYPE_VIDEO;\r
333                 c->width                        = output_format_.width;\r
334                 c->height                       = output_format_.height;\r
335                 c->time_base.den        = format_desc_.time_scale;\r
336                 c->time_base.num        = format_desc_.duration;\r
337                 c->gop_size                     = 25;\r
338                 c->flags                   |= format_desc_.field_mode == core::field_mode::progressive ? 0 : (CODEC_FLAG_INTERLACED_ME | CODEC_FLAG_INTERLACED_DCT);\r
339                 if(c->pix_fmt == PIX_FMT_NONE)\r
340                         c->pix_fmt = PIX_FMT_YUV420P;\r
341 \r
342                 if(c->codec_id == CODEC_ID_PRORES)\r
343                 {                       \r
344                         c->bit_rate     = c->width < 1280 ? 63*1000000 : 220*1000000;\r
345                         c->pix_fmt      = PIX_FMT_YUV422P10;\r
346                 }\r
347                 else if(c->codec_id == CODEC_ID_DNXHD)\r
348                 {\r
349                         if(c->width < 1280 || c->height < 720)\r
350                                 BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("Unsupported video dimensions."));\r
351 \r
352                         c->bit_rate     = 220*1000000;\r
353                         c->pix_fmt      = PIX_FMT_YUV422P;\r
354                 }\r
355                 else if(c->codec_id == CODEC_ID_DVVIDEO)\r
356                 {\r
357                         c->width = c->height == 1280 ? 960  : c->width;\r
358                         \r
359                         if(format_desc_.format == core::video_format::ntsc)\r
360                                 c->pix_fmt = PIX_FMT_YUV411P;\r
361                         else if(format_desc_.format == core::video_format::pal)\r
362                                 c->pix_fmt = PIX_FMT_YUV420P;\r
363                         else // dv50\r
364                                 c->pix_fmt = PIX_FMT_YUV422P;\r
365                         \r
366                         if(format_desc_.duration == 1001)                       \r
367                                 c->width = c->height == 1080 ? 1280 : c->width;                 \r
368                         else\r
369                                 c->width = c->height == 1080 ? 1440 : c->width;                 \r
370                 }\r
371                 else if(c->codec_id == CODEC_ID_H264)\r
372                 {                          \r
373                         c->pix_fmt = PIX_FMT_YUV420P;    \r
374                         if(options.empty())\r
375                         {\r
376                                 av_opt_set(c->priv_data, "preset", "ultrafast", 0);\r
377                                 av_opt_set(c->priv_data, "tune",   "fastdecode",   0);\r
378                                 av_opt_set(c->priv_data, "crf",    "5",     0);\r
379                         }\r
380                 }\r
381                 else if(c->codec_id == CODEC_ID_QTRLE)\r
382                 {\r
383                         c->pix_fmt = PIX_FMT_ARGB;\r
384                 }\r
385                                 \r
386                 c->max_b_frames = 0; // b-frames not supported.\r
387                                 \r
388                 boost::range::remove_erase_if(options, [&](const option& o)\r
389                 {\r
390                         return ffmpeg::av_opt_set(c, o.name.c_str(), o.value.c_str(), AV_OPT_SEARCH_CHILDREN) > -1 ||\r
391                                    ffmpeg::av_opt_set(c->priv_data, o.name.c_str(), o.value.c_str(), AV_OPT_SEARCH_CHILDREN) > -1;\r
392                 });\r
393                                 \r
394                 if(output_format_.format->flags & AVFMT_GLOBALHEADER)\r
395                         c->flags |= CODEC_FLAG_GLOBAL_HEADER;\r
396                 \r
397                 c->thread_count = boost::thread::hardware_concurrency();\r
398                 if(avcodec_open(c, encoder) < 0)\r
399                 {\r
400                         c->thread_count = 1;\r
401                         THROW_ON_ERROR2(avcodec_open(c, encoder), "[ffmpeg_consumer]");\r
402                 }\r
403 \r
404                 return std::shared_ptr<AVStream>(st, [](AVStream* st)\r
405                 {\r
406                         LOG_ON_ERROR2(avcodec_close(st->codec), "[ffmpeg_consumer]");\r
407                         av_freep(&st->codec);\r
408                         av_freep(&st);\r
409                 });\r
410         }\r
411                 \r
412         std::shared_ptr<AVStream> add_audio_stream(std::vector<option>& options)\r
413         {\r
414                 if(output_format_.acodec == CODEC_ID_NONE)\r
415                         return nullptr;\r
416 \r
417                 auto st = av_new_stream(oc_.get(), 1);\r
418                 if(!st)\r
419                         BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("Could not allocate audio-stream") << boost::errinfo_api_function("av_new_stream"));               \r
420                 \r
421                 auto encoder = avcodec_find_encoder(output_format_.acodec);\r
422                 if (!encoder)\r
423                         BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("codec not found"));\r
424                 \r
425                 auto c = st->codec;\r
426 \r
427                 avcodec_get_context_defaults3(c, encoder);\r
428 \r
429                 c->codec_id                     = output_format_.acodec;\r
430                 c->codec_type           = AVMEDIA_TYPE_AUDIO;\r
431                 c->sample_rate          = 48000;\r
432                 c->channels                     = 2;\r
433                 c->sample_fmt           = SAMPLE_FMT_S16;\r
434 \r
435                 if(output_format_.vcodec == CODEC_ID_FLV1)              \r
436                         c->sample_rate  = 44100;                \r
437 \r
438                 if(output_format_.format->flags & AVFMT_GLOBALHEADER)\r
439                         c->flags |= CODEC_FLAG_GLOBAL_HEADER;\r
440                                 \r
441                 boost::range::remove_erase_if(options, [&](const option& o)\r
442                 {\r
443                         return ffmpeg::av_opt_set(c, o.name.c_str(), o.value.c_str(), AV_OPT_SEARCH_CHILDREN) > -1;\r
444                 });\r
445 \r
446                 THROW_ON_ERROR2(avcodec_open(c, encoder), "[ffmpeg_consumer]");\r
447 \r
448                 return std::shared_ptr<AVStream>(st, [](AVStream* st)\r
449                 {\r
450                         LOG_ON_ERROR2(avcodec_close(st->codec), "[ffmpeg_consumer]");;\r
451                         av_freep(&st->codec);\r
452                         av_freep(&st);\r
453                 });\r
454         }\r
455 \r
456         std::shared_ptr<AVFrame> convert_video(core::read_frame& frame, AVCodecContext* c)\r
457         {\r
458                 if(!sws_) \r
459                 {\r
460                         sws_.reset(sws_getContext(format_desc_.width, format_desc_.height, PIX_FMT_BGRA, c->width, c->height, c->pix_fmt, SWS_BICUBIC, nullptr, nullptr, nullptr), sws_freeContext);\r
461                         if (sws_ == nullptr) \r
462                                 BOOST_THROW_EXCEPTION(caspar_exception() << msg_info("Cannot initialize the conversion context"));\r
463                 }\r
464 \r
465                 std::shared_ptr<AVFrame> in_frame(avcodec_alloc_frame(), av_free);\r
466                 avpicture_fill(reinterpret_cast<AVPicture*>(in_frame.get()), const_cast<uint8_t*>(frame.image_data().begin()), PIX_FMT_BGRA, format_desc_.width, format_desc_.height);\r
467                                 \r
468                 std::shared_ptr<AVFrame> out_frame(avcodec_alloc_frame(), av_free);\r
469                 picture_buf_.resize(avpicture_get_size(c->pix_fmt, c->width, c->height));\r
470                 avpicture_fill(reinterpret_cast<AVPicture*>(out_frame.get()), picture_buf_.data(), c->pix_fmt, c->width, c->height);\r
471 \r
472                 sws_scale(sws_.get(), in_frame->data, in_frame->linesize, 0, format_desc_.height, out_frame->data, out_frame->linesize);\r
473 \r
474                 return out_frame;\r
475         }\r
476   \r
477         void encode_video_frame(core::read_frame& frame)\r
478         { \r
479                 auto c = video_st_->codec;\r
480                 \r
481                 auto in_time  = static_cast<double>(in_frame_number_) / format_desc_.fps;\r
482                 auto out_time = static_cast<double>(out_frame_number_) / (static_cast<double>(c->time_base.den) / static_cast<double>(c->time_base.num));\r
483                 \r
484                 in_frame_number_++;\r
485 \r
486                 if(out_time - in_time > 0.01)\r
487                         return;\r
488  \r
489                 auto av_frame = convert_video(frame, c);\r
490                 av_frame->interlaced_frame      = format_desc_.field_mode != core::field_mode::progressive;\r
491                 av_frame->top_field_first       = format_desc_.field_mode == core::field_mode::upper;\r
492                 av_frame->pts                           = out_frame_number_++;\r
493 \r
494                 int out_size = THROW_ON_ERROR2(avcodec_encode_video(c, video_outbuf_.data(), video_outbuf_.size(), av_frame.get()), "[ffmpeg_consumer]");\r
495                 if(out_size == 0)\r
496                         return;\r
497                                 \r
498                 safe_ptr<AVPacket> pkt(new AVPacket, [](AVPacket* p)\r
499                 {\r
500                         av_free_packet(p);\r
501                         delete p;\r
502                 });\r
503                 av_init_packet(pkt.get());\r
504  \r
505                 if (c->coded_frame->pts != AV_NOPTS_VALUE)\r
506                         pkt->pts = av_rescale_q(c->coded_frame->pts, c->time_base, video_st_->time_base);\r
507 \r
508                 if(c->coded_frame->key_frame)\r
509                         pkt->flags |= AV_PKT_FLAG_KEY;\r
510 \r
511                 pkt->stream_index       = video_st_->index;\r
512                 pkt->data                       = video_outbuf_.data();\r
513                 pkt->size                       = out_size;\r
514                         \r
515                 av_interleaved_write_frame(oc_.get(), pkt.get());               \r
516         }\r
517                 \r
518         byte_vector convert_audio(core::read_frame& frame, AVCodecContext* c)\r
519         {\r
520                 if(!swr_)               \r
521                         swr_.reset(new audio_resampler(c->channels, format_desc_.audio_channels, \r
522                                                                                    c->sample_rate, format_desc_.audio_sample_rate,\r
523                                                                                    c->sample_fmt, AV_SAMPLE_FMT_S32));\r
524                 \r
525 \r
526                 auto audio_data = frame.audio_data();\r
527 \r
528                 std::vector<int8_t,  tbb::cache_aligned_allocator<int8_t>> audio_resample_buffer;\r
529                 std::copy(reinterpret_cast<const uint8_t*>(audio_data.begin()), \r
530                                   reinterpret_cast<const uint8_t*>(audio_data.begin()) + audio_data.size()*4, \r
531                                   std::back_inserter(audio_resample_buffer));\r
532                 \r
533                 audio_resample_buffer = swr_->resample(std::move(audio_resample_buffer));\r
534                 \r
535                 return byte_vector(audio_resample_buffer.begin(), audio_resample_buffer.end());\r
536         }\r
537 \r
538         void encode_audio_frame(core::read_frame& frame)\r
539         {                       \r
540                 auto c = audio_st_->codec;\r
541 \r
542                 boost::range::push_back(audio_buf_, convert_audio(frame, c));\r
543                 \r
544                 std::size_t frame_size = c->frame_size;\r
545                 auto input_audio_size = frame_size * av_get_bytes_per_sample(c->sample_fmt) * c->channels;\r
546                 \r
547                 while(audio_buf_.size() >= input_audio_size)\r
548                 {\r
549                         safe_ptr<AVPacket> pkt(new AVPacket, [](AVPacket* p)\r
550                         {\r
551                                 av_free_packet(p);\r
552                                 delete p;\r
553                         });\r
554                         av_init_packet(pkt.get());\r
555 \r
556                         if(frame_size > 1)\r
557                         {                                                               \r
558                                 pkt->size = avcodec_encode_audio(c, audio_outbuf_.data(), audio_outbuf_.size(), reinterpret_cast<short*>(audio_buf_.data()));\r
559                                 audio_buf_.erase(audio_buf_.begin(), audio_buf_.begin() + input_audio_size);\r
560                         }\r
561                         else\r
562                         {\r
563                                 audio_outbuf_ = std::move(audio_buf_);          \r
564                                 audio_buf_.clear();\r
565                                 pkt->size = audio_outbuf_.size();\r
566                                 pkt->data = audio_outbuf_.data();\r
567                         }\r
568                 \r
569                         if(pkt->size == 0)\r
570                                 return;\r
571 \r
572                         if (c->coded_frame && c->coded_frame->pts != AV_NOPTS_VALUE)\r
573                                 pkt->pts = av_rescale_q(c->coded_frame->pts, c->time_base, audio_st_->time_base);\r
574 \r
575                         pkt->flags               |= AV_PKT_FLAG_KEY;\r
576                         pkt->stream_index = audio_st_->index;\r
577                         pkt->data                 = reinterpret_cast<uint8_t*>(audio_outbuf_.data());\r
578                 \r
579                         av_interleaved_write_frame(oc_.get(), pkt.get());\r
580                 }\r
581         }\r
582                  \r
583         void send(const safe_ptr<core::read_frame>& frame)\r
584         {\r
585                 encode_executor_.begin_invoke([=]\r
586                 {               \r
587                         boost::timer frame_timer;\r
588 \r
589                         encode_video_frame(*frame);\r
590                         encode_audio_frame(*frame);\r
591 \r
592                         graph_->set_value("frame-time", frame_timer.elapsed()*format_desc_.fps*0.5);                    \r
593                 });\r
594         }\r
595 };\r
596 \r
597 struct ffmpeg_consumer_proxy : public core::frame_consumer\r
598 {\r
599         const std::wstring                              filename_;\r
600         const std::vector<option>                       options_;\r
601 \r
602         std::unique_ptr<ffmpeg_consumer> consumer_;\r
603 \r
604 public:\r
605 \r
606         ffmpeg_consumer_proxy(const std::wstring& filename, const std::vector<option>& options)\r
607                 : filename_(filename)\r
608                 , options_(options)\r
609         {\r
610         }\r
611         \r
612         virtual void initialize(const core::video_format_desc& format_desc, int)\r
613         {\r
614                 consumer_.reset();\r
615                 consumer_.reset(new ffmpeg_consumer(narrow(filename_), format_desc, options_));\r
616         }\r
617         \r
618         virtual bool send(const safe_ptr<core::read_frame>& frame) override\r
619         {\r
620                 consumer_->send(frame);\r
621                 return true;\r
622         }\r
623         \r
624         virtual std::wstring print() const override\r
625         {\r
626                 return consumer_ ? consumer_->print() : L"[ffmpeg_consumer]";\r
627         }\r
628 \r
629         virtual boost::property_tree::wptree info() const override\r
630         {\r
631                 boost::property_tree::wptree info;\r
632                 info.add(L"type", L"ffmpeg-consumer");\r
633                 info.add(L"filename", filename_);\r
634                 return info;\r
635         }\r
636                 \r
637         virtual bool has_synchronization_clock() const override\r
638         {\r
639                 return false;\r
640         }\r
641 \r
642         virtual size_t buffer_depth() const override\r
643         {\r
644                 return 1;\r
645         }\r
646 \r
647         virtual int index() const override\r
648         {\r
649                 return 200;\r
650         }\r
651 };      \r
652 \r
653 safe_ptr<core::frame_consumer> create_consumer(const std::vector<std::wstring>& params)\r
654 {\r
655         if(params.size() < 1 || params[0] != L"FILE")\r
656                 return core::frame_consumer::empty();\r
657         \r
658         auto filename   = (params.size() > 1 ? params[1] : L"");\r
659                         \r
660         std::vector<option> options;\r
661         \r
662         if(params.size() >= 3)\r
663         {\r
664                 for(auto opt_it = params.begin()+2; opt_it != params.end();)\r
665                 {\r
666                         auto name  = narrow(boost::trim_copy(boost::to_lower_copy(*opt_it++))).substr(1);\r
667                         auto value = narrow(boost::trim_copy(boost::to_lower_copy(*opt_it++)));\r
668                                 \r
669                         if(value == "h264")\r
670                                 value = "libx264";\r
671                         else if(value == "dvcpro")\r
672                                 value = "dvvideo";\r
673 \r
674                         options.push_back(option(name, value));\r
675                 }\r
676         }\r
677                 \r
678         return make_safe<ffmpeg_consumer_proxy>(env::media_folder() + filename, options);\r
679 }\r
680 \r
681 safe_ptr<core::frame_consumer> create_consumer(const boost::property_tree::wptree& ptree)\r
682 {\r
683         auto filename   = ptree.get<std::wstring>(L"path");\r
684         auto codec              = ptree.get(L"vcodec", L"libx264");\r
685 \r
686         std::vector<option> options;\r
687         options.push_back(option("vcodec", narrow(codec)));\r
688         \r
689         return make_safe<ffmpeg_consumer_proxy>(env::media_folder() + filename, options);\r
690 }\r
691 \r
692 }}\r