X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=modules%2Fffmpeg%2Fproducer%2Fvideo%2Fvideo_decoder.cpp;h=f365a7c96e724dc511d076d7c65633a27ac1b4db;hb=2f549904ed6da11061fa914fc99f0e0acdd90357;hp=3ac21b4f4b7cb9bfdf99aa0ef26b546673b87f9d;hpb=9c608bb54c3446734a9a010c1452af8914942a03;p=casparcg

diff --git a/modules/ffmpeg/producer/video/video_decoder.cpp b/modules/ffmpeg/producer/video/video_decoder.cpp
index 3ac21b4f4..f365a7c96 100644
--- a/modules/ffmpeg/producer/video/video_decoder.cpp
+++ b/modules/ffmpeg/producer/video/video_decoder.cpp
@@ -21,14 +21,19 @@
 
 #include "video_decoder.h"
 
-#include <common/memory/memcpy.h>
+#include "../util.h"
+#include "../filter/filter.h"
 
-#include <core/video_format.h>
-#include <core/producer/frame/basic_frame.h>
-#include <core/producer/frame/write_frame.h>
-#include <core/producer/frame/image_transform.h>
+#include "../../ffmpeg_error.h"
+#include "../../tbb_avcodec.h"
 
-#include <tbb/parallel_for.h>
+#include <core/producer/frame/frame_transform.h>
+#include <core/producer/frame/frame_factory.h>
+
+#include <boost/range/algorithm_ext/push_back.hpp>
+#include <boost/filesystem.hpp>
+
+#include <queue>
 
 #if defined(_MSC_VER)
 #pragma warning (push)
@@ -36,9 +41,7 @@
 #endif
 extern "C" 
 {
-	#define __STDC_CONSTANT_MACROS
-	#define __STDC_LIMIT_MACROS
-	#include <libswscale/swscale.h>
+	#include <libavcodec/avcodec.h>
 	#include <libavformat/avformat.h>
 }
 #if defined(_MSC_VER)
@@ -47,151 +50,169 @@ extern "C"
 
 namespace caspar {
 	
-core::pixel_format::type get_pixel_format(PixelFormat pix_fmt)
+struct video_decoder::implementation : boost::noncopyable
 {
-	switch(pix_fmt)
-	{
-		case PIX_FMT_GRAY8:		return core::pixel_format::gray;
-		case PIX_FMT_BGRA:		return core::pixel_format::bgra;
-		case PIX_FMT_ARGB:		return core::pixel_format::argb;
-		case PIX_FMT_RGBA:		return core::pixel_format::rgba;
-		case PIX_FMT_ABGR:		return core::pixel_format::abgr;
-		case PIX_FMT_YUV444P:	return core::pixel_format::ycbcr;
-		case PIX_FMT_YUV422P:	return core::pixel_format::ycbcr;
-		case PIX_FMT_YUV420P:	return core::pixel_format::ycbcr;
-		case PIX_FMT_YUV411P:	return core::pixel_format::ycbcr;
-		case PIX_FMT_YUV410P:	return core::pixel_format::ycbcr;
-		case PIX_FMT_YUVA420P:	return core::pixel_format::ycbcra;
-		default:				return core::pixel_format::invalid;
-	}
-}
+	const safe_ptr<core::frame_factory>		frame_factory_; // Supplies the video format whose fps seeds fps_.
+	std::shared_ptr<AVCodecContext>			codec_context_; // Set once the video codec is opened; poll() checks it for null.
+	int										index_; // Stream index; push() drops packets from other streams.
 
-core::pixel_format_desc get_pixel_format_desc(PixelFormat pix_fmt, size_t width, size_t height)
-{
-	// Get linesizes
-	AVPicture dummy_pict;	
-	avpicture_fill(&dummy_pict, nullptr, pix_fmt, width, height);
+	std::queue<std::shared_ptr<AVPacket>>	packets_; // Pending packets; a null entry makes poll() drain and flush the codec.
 
-	core::pixel_format_desc desc;
-	desc.pix_fmt = get_pixel_format(pix_fmt);
-		
-	switch(desc.pix_fmt)
+	filter									filter_; // Executed on every decoded frame in poll().
+
+	double									fps_; // Frame rate reported by fps(); doubled when double_rate(filter) is true.
+	int64_t									nb_frames_; // Copied from the selected stream's nb_frames; 0 until then.
+
+	size_t									width_; // Codec frame width; stays 0 if the video codec was not opened.
+	size_t									height_; // Codec frame height; stays 0 if the video codec was not opened.
+
+public:
+	explicit implementation(const safe_ptr<AVFormatContext>& context, const safe_ptr<core::frame_factory>& frame_factory, const std::wstring& filter) 
+		: frame_factory_(frame_factory)
+		, filter_(filter)
+		, fps_(frame_factory_->get_video_format_desc().fps) // Default rate; overwritten in the try block once the codec is open.
+		, nb_frames_(0)
+		, width_(0)
+		, height_(0)
 	{
-	case core::pixel_format::gray:
+		try
 		{
-			desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0]/4, height, 1));						
-			return desc;
+			AVCodec* dec;
+			index_ = THROW_ON_ERROR2(av_find_best_stream(context.get(), AVMEDIA_TYPE_VIDEO, -1, -1, &dec, 0), "[video_decoder]");
+			// Open the decoder for the selected stream; codec_context_ releases it through tbb_avcodec_close.
+			THROW_ON_ERROR2(tbb_avcodec_open(context->streams[index_]->codec, dec), "[video_decoder]");
+								
+			codec_context_.reset(context->streams[index_]->codec, tbb_avcodec_close);
+		
+			CASPAR_LOG(debug) << "[video_decoder] " << context->streams[index_]->codec->codec->long_name;
+
+			// Some files give an invalid time_base numerator, try to fix it.
+
+			fix_meta_data(*context);
+			// Frame rate is taken from the codec time_base as den/num.
+			fps_ = static_cast<double>(codec_context_->time_base.den) / static_cast<double>(codec_context_->time_base.num);
+			nb_frames_ = context->streams[index_]->nb_frames;
+			// Report twice the rate when double_rate(filter) says so.
+			if(double_rate(filter))
+				fps_ *= 2;
+
+			width_  = codec_context_->width;
+			height_ = codec_context_->height;
 		}
-	case core::pixel_format::bgra:
-	case core::pixel_format::argb:
-	case core::pixel_format::rgba:
-	case core::pixel_format::abgr:
+		catch(...) // Any failure above: track the best audio stream instead and run without video.
 		{
-			desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0]/4, height, 4));						
-			return desc;
+			index_ = THROW_ON_ERROR2(av_find_best_stream(context.get(), AVMEDIA_TYPE_AUDIO, -1, -1, nullptr, 0), "[video_decoder]");
+			// NOTE(review): if the audio lookup above throws, the original error is presumably never logged - confirm intended.
+			CASPAR_LOG_CURRENT_EXCEPTION();
+			CASPAR_LOG(warning) << "[video_decoder] Failed to open video-stream. Running without video.";	
 		}
-	case core::pixel_format::ycbcr:
-	case core::pixel_format::ycbcra:
-		{		
-			// Find chroma height
-			size_t size2 = dummy_pict.data[2] - dummy_pict.data[1];
-			size_t h2 = size2/dummy_pict.linesize[1];			
-
-			desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[0], height, 1));
-			desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[1], h2, 1));
-			desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[2], h2, 1));
-
-			if(desc.pix_fmt == core::pixel_format::ycbcra)						
-				desc.planes.push_back(core::pixel_format_desc::plane(dummy_pict.linesize[3], height, 1));	
-			return desc;
-		}		
-	default:		
-		desc.pix_fmt = core::pixel_format::invalid;
-		return desc;
 	}
-}
 
-struct video_decoder::implementation : boost::noncopyable
-{	
-	std::shared_ptr<core::frame_factory> frame_factory_;
-	std::shared_ptr<SwsContext> sws_context_;
+	void push(const std::shared_ptr<AVPacket>& packet) // Queues a packet for poll(); null packets are queued as well.
+	{
+		if(packet && packet->stream_index != index_) // Non-null packet from a stream other than index_: ignore it.
+			return;
 
-	AVCodecContext* codec_context_;
+		packets_.push(packet);
+	}
 
-	const int width_;
-	const int height_;
-	const PixelFormat pix_fmt_;
-	core::pixel_format_desc desc_;
+	std::vector<std::shared_ptr<AVFrame>> poll() // Processes the front packet; returns the filtered frames (possibly none).
+	{		
+		std::vector<std::shared_ptr<AVFrame>> result;
 
-public:
-	explicit implementation(AVCodecContext* codec_context, const safe_ptr<core::frame_factory>& frame_factory) 
-		: frame_factory_(frame_factory)
-		, codec_context_(codec_context)
-		, width_(codec_context_->width)
-		, height_(codec_context_->height)
-		, pix_fmt_(codec_context_->pix_fmt)
-		, desc_(get_pixel_format_desc(pix_fmt_, width_, height_))
-	{
-		if(desc_.pix_fmt == core::pixel_format::invalid)
+		if(packets_.empty())
+			return result;
+		// No opened video codec: answer with placeholder frames instead of decoding.
+		if(!codec_context_)
+			return empty_poll();
+
+		auto packet = packets_.front();
+					
+		if(packet)
+		{			
+			BOOST_FOREACH(auto& frame, decode(*packet))
+				boost::range::push_back(result, filter_.execute(frame));
+			// decode() zeroes packet->size on return, so the packet is popped after one successful decode call.
+			if(packet->size == 0)
+				packets_.pop();
+		}
+		else // Null packet: drain frames still held by the decoder, then flush.
 		{
-			CASPAR_LOG(warning) << "Hardware accelerated color transform not supported.";
-
-			desc_ = get_pixel_format_desc(PIX_FMT_BGRA, width_, height_);
-			double param;
-			sws_context_.reset(sws_getContext(width_, height_, pix_fmt_, width_, height_, PIX_FMT_BGRA, SWS_BILINEAR, nullptr, nullptr, &param), sws_freeContext);
-			if(!sws_context_)
-				BOOST_THROW_EXCEPTION(operation_failed() <<
-									  msg_info("Could not create software scaling context.") << 
-									  boost::errinfo_api_function("sws_getContext"));
+			if(codec_context_->codec->capabilities & CODEC_CAP_DELAY)
+			{
+				AVPacket pkt;
+				av_init_packet(&pkt);
+				pkt.data = nullptr;
+				pkt.size = 0;
+				// Feed an empty packet; any frame it yields is filtered like a normal one.
+				BOOST_FOREACH(auto& frame, decode(pkt))
+					boost::range::push_back(result, filter_.execute(frame));	
+			}
+			// Nothing (more) came out: drop the null packet, flush the codec buffers and emit a nullptr frame.
+			if(result.empty())
+			{					
+				packets_.pop();
+				avcodec_flush_buffers(codec_context_.get());
+				result.push_back(nullptr);
+			}
 		}
+		
+		return result;
 	}
-	
-	safe_ptr<core::write_frame> execute(void* tag, const aligned_buffer& video_packet)
+
+	std::vector<std::shared_ptr<AVFrame>> empty_poll() // Called by poll() when codec_context_ is null; consumes one queued packet.
 	{				
-		safe_ptr<AVFrame> decoded_frame(avcodec_alloc_frame(), av_free);
+		auto packet = packets_.front();
+		packets_.pop();
+		// A null packet is answered with a single nullptr frame.
+		if(!packet)			
+			return boost::assign::list_of(nullptr);
+		// Any other packet yields one freshly allocated frame whose data[0] is nullptr.
+		std::shared_ptr<AVFrame> frame(avcodec_alloc_frame(), av_free);
+		frame->data[0] = nullptr;
+
+		return boost::assign::list_of(frame);					
+	}
+
+	std::vector<std::shared_ptr<AVFrame>> decode(AVPacket& pkt) // Decodes one packet; returns the frame (repeated per repeat_pict) or nothing.
+	{
+		std::shared_ptr<AVFrame> decoded_frame(avcodec_alloc_frame(), av_free);
 
 		int frame_finished = 0;
-		const int result = avcodec_decode_video(codec_context_, decoded_frame.get(), &frame_finished, video_packet.data(), video_packet.size());
+		THROW_ON_ERROR2(avcodec_decode_video2(codec_context_.get(), decoded_frame.get(), &frame_finished, &pkt), "[video_decoder]");
 		
-		if(result < 0)
-			BOOST_THROW_EXCEPTION(invalid_operation() << msg_info("avcodec_decode_video failed"));
+		// If a decoder consumes less than the whole packet then something is wrong:
+		// it might be just harmless padding at the end, or a problem with the
+		// AVParser or demuxer which put more than one frame in an AVPacket.
+		pkt.data = nullptr;
+		pkt.size = 0;
+		// The packet is marked fully consumed above even when no picture was completed.
+		if(frame_finished == 0)	
+			return std::vector<std::shared_ptr<AVFrame>>();
+		// An odd repeat_pict is only warned about; the return below emits 1 + repeat_pict/2 copies of the frame pointer.
+		if(decoded_frame->repeat_pict % 2 > 0)
+			CASPAR_LOG(warning) << "[video_decoder]: Field repeat_pict not implemented.";
 		
-		auto write = frame_factory_->create_frame(tag, desc_);
-		if(sws_context_ == nullptr)
-		{
-			tbb::parallel_for(0, static_cast<int>(desc_.planes.size()), 1, [&](int n)
-			{
-				auto plane            = desc_.planes[n];
-				auto result           = write->image_data(n).begin();
-				auto decoded          = decoded_frame->data[n];
-				auto decoded_linesize = decoded_frame->linesize[n];
-				
-				// Copy line by line since ffmpeg sometimes pads each line.
-				tbb::parallel_for(0, static_cast<int>(desc_.planes[n].height), 1, [&](int y)
-				{
-					fast_memcpy(result + y*plane.linesize, decoded + y*decoded_linesize, plane.linesize);
-				});
-			});
-		}
-		else
-		{
-			// Uses sws_scale when we don't support the provided color-space.
-			safe_ptr<AVFrame> av_frame(avcodec_alloc_frame(), av_free);	
-			avcodec_get_frame_defaults(av_frame.get());			
-			avpicture_fill(reinterpret_cast<AVPicture*>(av_frame.get()), write->image_data().begin(), PIX_FMT_BGRA, width_, height_);
-		 
-			sws_scale(sws_context_.get(), decoded_frame->data, decoded_frame->linesize, 0, height_, av_frame->data, av_frame->linesize);	
-		}	
-
-		// DVVIDEO is in lower field. Make it upper field if needed.
-		if(codec_context_->codec_id == CODEC_ID_DVVIDEO && frame_factory_->get_video_format_desc().mode == core::video_mode::upper)
-			write->get_image_transform().set_fill_translation(0.0f, 1.0/static_cast<double>(height_));
-
-		return write;
+		return std::vector<std::shared_ptr<AVFrame>>(1 + decoded_frame->repeat_pict/2, decoded_frame);
+	}
+	
+	bool ready() const // True while at least one packet is queued for poll().
+	{
+		return !packets_.empty();
+	}
+	
+	double fps() const // Returns fps_ as established by the constructor.
+	{
+		return fps_;
 	}
 };
 
-video_decoder::video_decoder(AVCodecContext* codec_context, const safe_ptr<core::frame_factory>& frame_factory) : impl_(new implementation(codec_context, frame_factory)){}
-safe_ptr<core::write_frame> video_decoder::execute(void* tag, const aligned_buffer& video_packet){return impl_->execute(tag, video_packet);}
-
+video_decoder::video_decoder(const safe_ptr<AVFormatContext>& context, const safe_ptr<core::frame_factory>& frame_factory, const std::wstring& filter) : impl_(new implementation(context, frame_factory, filter)){} // Every member below forwards to impl_.
+void video_decoder::push(const std::shared_ptr<AVPacket>& packet){impl_->push(packet);}
+std::vector<std::shared_ptr<AVFrame>> video_decoder::poll(){return impl_->poll();}
+bool video_decoder::ready() const{return impl_->ready();}
+double video_decoder::fps() const{return impl_->fps();}
+int64_t video_decoder::nb_frames() const{return impl_->nb_frames_;} // Reads the implementation's field directly.
+size_t video_decoder::width() const{return impl_->width_;} // Reads the implementation's field directly.
+size_t video_decoder::height() const{return impl_->height_;} // Reads the implementation's field directly.
 }
\ No newline at end of file