#include <core/producer/frame/pixel_format.h>\r
#include <core/video_format.h>\r
\r
+#include <gl/glew.h>\r
+\r
#include <boost/foreach.hpp>\r
+#include <boost/range.hpp>\r
+#include <boost/range/algorithm/find.hpp>\r
\r
+#include <algorithm>\r
#include <array>\r
+#include <deque>\r
#include <unordered_map>\r
\r
namespace caspar { namespace core {\r
\r
struct image_mixer::implementation : boost::noncopyable\r
-{ \r
- static const size_t LOCAL_KEY_INDEX = 3;\r
- static const size_t LAYER_KEY_INDEX = 4;\r
-\r
- struct render_item\r
- {\r
- pixel_format_desc desc;\r
- std::vector<safe_ptr<device_buffer>> textures;\r
- core::image_transform transform;\r
- };\r
+{ \r
+ // A layer is an ordered sequence of render items; begin_layer() appends a new one and\r
+ // visit() appends items to the most recently added one.\r
+ typedef std::deque<render_item> layer;\r
\r
video_channel_context& channel_;\r
- \r
- std::stack<core::image_transform> transform_stack_;\r
- std::queue<std::queue<render_item>> render_queue_;\r
- \r
- image_kernel kernel_;\r
- \r
- safe_ptr<host_buffer> read_buffer_;\r
- safe_ptr<device_buffer> draw_buffer_;\r
- safe_ptr<device_buffer> write_buffer_;\r
\r
- safe_ptr<device_buffer> local_key_buffer_;\r
- safe_ptr<device_buffer> layer_key_buffer_;\r
+ // State accumulated while frames are visited: begin() pushes onto the transform and\r
+ // video-mode stacks and end() pops them; begin_layer()/end_layer() push/pop the blend mode.\r
+ std::vector<image_transform> transform_stack_;\r
+ std::vector<video_mode::type> video_mode_stack_;\r
+ std::stack<blend_mode::type> blend_mode_stack_;\r
\r
- bool local_key_;\r
- bool layer_key_;\r
+ // Layers queued for the next render(); render() moves this container out.\r
+ std::deque<std::deque<render_item>> layers_; // layer/stream/items\r
\r
+ image_kernel kernel_; \r
+\r
+ // Assigned the most recent draw buffer in render(); presumably keeps that buffer alive\r
+ // while the host read started there is still pending - TODO confirm.\r
+ std::shared_ptr<device_buffer> active_buffer_;\r
public:\r
+ // Binds the mixer to its channel context. The transform stack starts with one\r
+ // default-constructed transform and the video-mode stack with video_mode::progressive, so\r
+ // begin() always has a back() element to combine with.\r
+ // NOTE(review): blend_mode_stack_ starts empty while visit() reads its top(); begin_layer()\r
+ // is presumably always called before visit() - confirm with callers.\r
implementation(video_channel_context& video_channel) \r
: channel_(video_channel)\r
- , read_buffer_(video_channel.ogl().create_host_buffer(video_channel.get_format_desc().size, host_buffer::read_only))\r
- , draw_buffer_(video_channel.ogl().create_device_buffer(video_channel.get_format_desc().width, channel_.get_format_desc().height, 4))\r
- , write_buffer_ (video_channel.ogl().create_device_buffer(video_channel.get_format_desc().width, channel_.get_format_desc().height, 4))\r
- , local_key_buffer_(video_channel.ogl().create_device_buffer(video_channel.get_format_desc().width, channel_.get_format_desc().height, 1))\r
- , layer_key_buffer_(video_channel.ogl().create_device_buffer(video_channel.get_format_desc().width, channel_.get_format_desc().height, 1))\r
- , local_key_(false)\r
- , layer_key_(false)\r
+ , transform_stack_(1)\r
+ , video_mode_stack_(1, video_mode::progressive)\r
{\r
- transform_stack_.push(core::image_transform());\r
-\r
- channel_.ogl().invoke([=]\r
- {\r
- if(!GLEE_VERSION_3_0)\r
- CASPAR_LOG(warning) << "Missing OpenGL 3.0 support.";//BOOST_THROW_EXCEPTION(not_supported() << msg_info("Missing OpenGL 3.0 support."));\r
- });\r
}\r
\r
- void begin(const core::basic_frame& frame)\r
+ // Calls gc() on the channel's OGL device when the mixer is destroyed\r
+ // (presumably to release buffers that are no longer referenced - TODO confirm).\r
+ ~implementation()\r
+ {\r
+ channel_.ogl().gc();\r
+ }\r
+ \r
+ // Enters a frame: pushes the current transform multiplied by the frame's image transform,\r
+ // and pushes the frame's video mode. A frame whose mode is progressive inherits the mode\r
+ // currently on top of the stack instead of overriding it. Must be balanced by end().\r
+ void begin(core::basic_frame& frame)\r
{\r
- transform_stack_.push(transform_stack_.top()*frame.get_image_transform());\r
+ transform_stack_.push_back(transform_stack_.back()*frame.get_image_transform());\r
+ video_mode_stack_.push_back(frame.get_mode() == video_mode::progressive ? video_mode_stack_.back() : frame.get_mode());\r
}\r
\r
+ // Records a write_frame as a render item in the most recently begun layer, using the\r
+ // transform, video mode and blend mode currently on top of their stacks.\r
+ // Requires that at least one layer exists (asserted) and reads blend_mode_stack_.top().\r
void visit(core::write_frame& frame)\r
- { \r
- render_item item = {frame.get_pixel_format_desc(), frame.get_textures(), transform_stack_.top()*frame.get_image_transform()}; \r
- render_queue_.back().push(item);\r
+ { \r
+ CASPAR_ASSERT(!layers_.empty());\r
+\r
+ // Check if frame has been discarded by interlacing: when both an upper and a lower\r
+ // field mode are present anywhere on the video-mode stack, the frame is skipped.\r
+ if(boost::range::find(video_mode_stack_, video_mode::upper) != video_mode_stack_.end() && boost::range::find(video_mode_stack_, video_mode::lower) != video_mode_stack_.end())\r
+ return;\r
+ \r
+ core::render_item item;\r
+ item.pix_desc = frame.get_pixel_format_desc();\r
+ item.textures = frame.get_textures();\r
+ item.transform = transform_stack_.back();\r
+ item.mode = video_mode_stack_.back();\r
+ item.tag = frame.tag();\r
+ item.blend_mode = blend_mode_stack_.top(); \r
+\r
+ // Append the item only if an equal item is not already in the layer\r
+ // (equality is whatever render_item's operator== defines; not visible here).\r
+ auto& layer = layers_.back();\r
+ if(boost::range::find(layer, item) == layer.end())\r
+ layer.push_back(item);\r
}\r
\r
+ // Leaves the frame entered by the matching begin(): pops the transform and video mode\r
+ // that begin() pushed.\r
void end()\r
{\r
- transform_stack_.pop();\r
+ transform_stack_.pop_back();\r
+ video_mode_stack_.pop_back();\r
}\r
\r
- void begin_layer()\r
+ // Starts a new, empty layer and makes blend_mode the blend mode that visit() stamps on\r
+ // items until the matching end_layer().\r
+ void begin_layer(blend_mode::type blend_mode)\r
{\r
- render_queue_.push(std::queue<render_item>());\r
+ blend_mode_stack_.push(blend_mode);\r
+ layers_.push_back(layer());\r
}\r
\r
+ // Ends the current layer by popping the blend mode pushed by begin_layer().\r
+ // The layer itself stays in layers_ until render() takes it.\r
void end_layer()\r
{\r
+ blend_mode_stack_.pop();\r
}\r
-\r
- void reinitialize_buffers()\r
- {\r
- read_buffer_ = channel_.ogl().create_host_buffer(channel_.get_format_desc().size, host_buffer::read_only);\r
- draw_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 4);\r
- write_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 4);\r
- local_key_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 1);\r
- layer_key_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 1);\r
- channel_.ogl().gc();\r
- }\r
-\r
- safe_ptr<host_buffer> render()\r
+ \r
+ // Takes all layers queued so far (layers_ is moved from) and schedules their rendering on\r
+ // the OGL device via begin_invoke(). Returns the future produced by begin_invoke(), which\r
+ // yields the host buffer returned by render(std::deque<layer>&&).\r
+ // NOTE(review): the [=] capture copies the local `layers` into the closure; the std::move\r
+ // inside the lambda then moves from that copy.\r
+ boost::unique_future<safe_ptr<host_buffer>> render()\r
{ \r
- auto read_buffer = read_buffer_;\r
- auto result = channel_.ogl().begin_invoke([=]() -> safe_ptr<host_buffer>\r
+ auto layers = std::move(layers_);\r
+ return channel_.ogl().begin_invoke([=]() mutable\r
{\r
- read_buffer->map();\r
- return read_buffer;\r
+ return render(std::move(layers));\r
});\r
+ }\r
+ \r
+ // Draws every layer, in order, into a newly created and cleared 4-stride device buffer,\r
+ // then creates a read-only host buffer, starts reading the device buffer into it and\r
+ // returns the host buffer. layer_key_buffer is threaded through the draw() calls so that a\r
+ // key left over by one layer is available to the next one.\r
+ safe_ptr<host_buffer> render(std::deque<layer>&& layers)\r
+ {\r
+ std::shared_ptr<device_buffer> layer_key_buffer;\r
\r
- auto render_queue = std::move(render_queue_);\r
-\r
- channel_.ogl().begin_invoke([=]() mutable\r
- {\r
- if(draw_buffer_->width() != channel_.get_format_desc().width || draw_buffer_->height() != channel_.get_format_desc().height)\r
- reinitialize_buffers();\r
-\r
- local_key_ = false;\r
- layer_key_ = false;\r
+ auto draw_buffer = create_device_buffer(4);\r
+ \r
+ BOOST_FOREACH(auto& layer, layers)\r
+ draw(std::move(layer), draw_buffer, layer_key_buffer);\r
+ \r
+ auto host_buffer = channel_.ogl().create_host_buffer(channel_.get_format_desc().size, host_buffer::read_only);\r
+ channel_.ogl().attach(*draw_buffer);\r
+ host_buffer->begin_read(draw_buffer->width(), draw_buffer->height(), format(draw_buffer->stride()));\r
+ \r
+ // Keep a reference to the buffer being read (presumably so it outlives the pending\r
+ // read - TODO confirm).\r
+ active_buffer_ = draw_buffer;\r
\r
- // Clear buffers.\r
- local_key_buffer_->clear();\r
- layer_key_buffer_->clear();\r
- draw_buffer_->clear();\r
+ channel_.ogl().flush(); // NOTE: This is important, otherwise fences will deadlock.\r
+ \r
+ return host_buffer;\r
+ }\r
\r
- // Draw items in device.\r
+ // Draws one layer into draw_buffer. An empty layer is a no-op.\r
+ // When has_overlapping_items() reports overlap, the items are first drawn into a temporary\r
+ // 4-stride buffer with their blend modes overridden, and that buffer is then drawn into\r
+ // draw_buffer as a single bgra item using the blend mode of the layer's first item.\r
+ // Otherwise the items are drawn straight into draw_buffer.\r
+ // On exit the layer's remaining local key buffer is swapped into layer_key_buffer, so it\r
+ // is what the next draw() call receives as its layer key.\r
+ // TODO: We might have more overlaps for opacity transitions\r
+ // TODO: What about blending modes, are they ok? Maybe only overlap detection is required for opacity?\r
+ void draw(layer&& layer, const safe_ptr<device_buffer>& draw_buffer, std::shared_ptr<device_buffer>& layer_key_buffer)\r
+ { \r
+ if(layer.empty())\r
+ return;\r
\r
- while(!render_queue.empty())\r
- {\r
- auto layer = render_queue.front();\r
- render_queue.pop();\r
+ // first: bit mask of video-mode fields for which a key is pending; second: the key buffer.\r
+ std::pair<int, std::shared_ptr<device_buffer>> local_key_buffer;\r
\r
- draw_buffer_->attach(); \r
+ if(has_overlapping_items(layer, layer.front().blend_mode))\r
+ {\r
+ auto local_draw_buffer = create_device_buffer(4); \r
+ auto local_blend_mode = layer.front().blend_mode;\r
\r
- while(!layer.empty())\r
+ // Bit mask of the video-mode fields already written in local_draw_buffer.\r
+ int fields = 0;\r
+ BOOST_FOREACH(auto& item, layer)\r
+ {\r
+ if(fields & item.mode)\r
+ item.blend_mode = blend_mode::normal; // Disable blending, it will be used when merging back into render stack.\r
+ else\r
{\r
- draw(layer.front());\r
- layer.pop();\r
- channel_.ogl().yield(); // Allow quick buffer allocation to execute.\r
+ item.blend_mode = blend_mode::replace; // Target field is empty, no blending, just copy\r
+ fields |= item.mode;\r
}\r
\r
- layer_key_ = local_key_; // If there was only key in last layer then use it as key for the entire next layer.\r
- local_key_ = false;\r
-\r
- std::swap(local_key_buffer_, layer_key_buffer_);\r
+ draw_item(std::move(item), local_draw_buffer, local_key_buffer, layer_key_buffer); \r
}\r
+ \r
+ // Merge the temporary buffer into draw_buffer as one full-frame bgra item, applying\r
+ // the layer's original blend mode; no key buffers are passed for this merge.\r
+ render_item item;\r
+ item.pix_desc.pix_fmt = pixel_format::bgra;\r
+ item.pix_desc.planes.push_back(pixel_format_desc::plane(channel_.get_format_desc().width, channel_.get_format_desc().height, 4));\r
+ item.textures.push_back(local_draw_buffer);\r
+ item.blend_mode = local_blend_mode;\r
+\r
+ kernel_.draw(channel_.ogl(), std::move(item), draw_buffer, nullptr, nullptr);\r
+ }\r
+ else // fast path\r
+ {\r
+ BOOST_FOREACH(auto& item, layer) \r
+ draw_item(std::move(item), draw_buffer, local_key_buffer, layer_key_buffer); \r
+ } \r
\r
- std::swap(draw_buffer_, write_buffer_);\r
-\r
- // Start transfer from device to host. \r
- read_buffer_ = channel_.ogl().create_host_buffer(channel_.get_format_desc().size, host_buffer::read_only); \r
- write_buffer_->write(*read_buffer_);\r
- });\r
+ // The pending-key mask must be either empty or cover the whole (progressive) frame here.\r
+ CASPAR_ASSERT(local_key_buffer.first == 0 || local_key_buffer.first == core::video_mode::progressive);\r
\r
- return std::move(result.get());\r
+ std::swap(local_key_buffer.second, layer_key_buffer);\r
}\r
- \r
- void draw(const render_item& item)\r
- { \r
- // Bind textures\r
\r
- for(size_t n = 0; n < item.textures.size(); ++n)\r
- item.textures[n]->bind(n); \r
-\r
- // Setup key and kernel\r
-\r
- bool local_key = false;\r
- bool layer_key = false;\r
- \r
- if(item.transform.get_is_key()) // This is a key frame, render it to the local_key buffer for later use.\r
+ // Draws a single item.\r
+ // A key item (item.transform.get_is_key()) is drawn into the local key buffer, which is\r
+ // created on demand as a cleared 1-stride buffer, and its video-mode bits are added to\r
+ // local_key_buffer.first.\r
+ // Any other item is drawn into draw_buffer with the current local and layer key buffers;\r
+ // afterwards its video-mode bits are toggled in local_key_buffer.first and the local key\r
+ // buffer is released once the mask reaches zero.\r
+ void draw_item(render_item&& item, \r
+ const safe_ptr<device_buffer>& draw_buffer, \r
+ std::pair<int, std::shared_ptr<device_buffer>>& local_key_buffer, \r
+ std::shared_ptr<device_buffer>& layer_key_buffer)\r
+ { \r
+ if(item.transform.get_is_key())\r
{\r
- if(!local_key_) // Initialize local-key if it is not active.\r
+ if(!local_key_buffer.second)\r
{\r
- local_key_buffer_->clear();\r
- local_key_buffer_->attach();\r
- local_key_ = true;\r
+ local_key_buffer.first = 0;\r
+ local_key_buffer.second = create_device_buffer(1);\r
}\r
- } \r
- else // This is a normal frame. Use key buffers if they are active.\r
- { \r
- local_key = local_key_;\r
- layer_key = layer_key_;\r
-\r
- if(local_key_) // Use local key if we have it.\r
+ \r
+ local_key_buffer.first |= item.mode; // Add field to flag.\r
+ kernel_.draw(channel_.ogl(), std::move(item), make_safe(local_key_buffer.second), nullptr, nullptr);\r
+ }\r
+ else\r
+ {\r
+ kernel_.draw(channel_.ogl(), std::move(item), draw_buffer, local_key_buffer.second, layer_key_buffer);\r
+ // NOTE(review): item.mode is read after item was passed through std::move above;\r
+ // consider reading the mode before the call. Also, ^= toggles bits, so with no\r
+ // pending key it sets them instead of clearing them - confirm this is intended.\r
+ local_key_buffer.first ^= item.mode; // Remove field from flag.\r
+ \r
+ if(local_key_buffer.first == 0) // If all fields from key have been used, reset it\r
{\r
- local_key_buffer_->bind(LOCAL_KEY_INDEX);\r
- draw_buffer_->attach(); \r
- local_key_ = false; // Use it only one time.\r
- } \r
-\r
- if(layer_key_) // Use layer key if we have it.\r
- layer_key_buffer_->bind(LAYER_KEY_INDEX);\r
- } \r
+ local_key_buffer.first = 0;\r
+ local_key_buffer.second.reset();\r
+ }\r
+ }\r
+ }\r
\r
- // Draw\r
+ // Decides whether draw() must composite the layer through a temporary buffer.\r
+ // Returns true only when the layer holds at least two items, blend_mode is not\r
+ // blend_mode::normal, and some item's tag differs from the first item's tag.\r
+ // The commented-out code below is an earlier, more detailed variant kept for reference.\r
+ //// TODO: Optimize\r
+ bool has_overlapping_items(const layer& layer, blend_mode::type blend_mode)\r
+ {\r
+ if(layer.size() < 2)\r
+ return false; \r
+ \r
+ if(blend_mode == blend_mode::normal)\r
+ return false;\r
+ \r
+ return std::any_of(layer.begin(), layer.end(), [&](const render_item& item)\r
+ {\r
+ return item.tag != layer.front().tag;\r
+ });\r
\r
- kernel_.draw(channel_.get_format_desc().width, channel_.get_format_desc().height, item.desc, item.transform, local_key, layer_key); \r
+ //std::copy_if(layer.begin(), layer.end(), std::back_inserter(fill), [&](const render_item& item)\r
+ //{\r
+ // return !item.transform.get_is_key();\r
+ //});\r
+ // \r
+ //if(blend_mode == blend_mode::normal) // only overlap if opacity\r
+ //{\r
+ // return std::any_of(fill.begin(), fill.end(), [&](const render_item& item)\r
+ // {\r
+ // return item.transform.get_opacity() < 1.0 - 0.001;\r
+ // });\r
+ //}\r
+\r
+ //// simple solution, just check if we have different video streams / tags.\r
+ //return std::any_of(fill.begin(), fill.end(), [&](const render_item& item)\r
+ //{\r
+ // return item.tag != fill.front().tag;\r
+ //});\r
+ } \r
+ \r
+ // Creates a device buffer with the channel format's width and height and the given\r
+ // stride, clears it through the OGL device, and returns it.\r
+ safe_ptr<device_buffer> create_device_buffer(size_t stride)\r
+ {\r
+ auto buffer = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, stride);\r
+ channel_.ogl().clear(*buffer);\r
+ return buffer;\r
}\r
- \r
- safe_ptr<write_frame> create_frame(void* tag, const core::pixel_format_desc& desc)\r
+\r
+ // Creates a write_frame on the channel's OGL device for the given pixel format.\r
+ // tag is passed through to the frame unchanged; visit() later copies frame.tag() into the\r
+ // render item, and has_overlapping_items() compares those tags.\r
+ safe_ptr<write_frame> create_frame(const void* tag, const core::pixel_format_desc& desc)\r
{\r
- return make_safe<write_frame>(channel_.ogl(), reinterpret_cast<int>(tag), desc);\r
+ return make_safe<write_frame>(channel_.ogl(), tag, desc);\r
}\r
};\r
\r
+// Public image_mixer members: the constructor allocates the implementation object and every\r
+// other member below forwards its arguments to the same-named implementation method.\r
image_mixer::image_mixer(video_channel_context& video_channel) : impl_(new implementation(video_channel)){}\r
-void image_mixer::begin(const core::basic_frame& frame){impl_->begin(frame);}\r
+void image_mixer::begin(core::basic_frame& frame){impl_->begin(frame);}\r
void image_mixer::visit(core::write_frame& frame){impl_->visit(frame);}\r
void image_mixer::end(){impl_->end();}\r
-safe_ptr<host_buffer> image_mixer::render(){return impl_->render();}\r
-safe_ptr<write_frame> image_mixer::create_frame(void* tag, const core::pixel_format_desc& desc){return impl_->create_frame(tag, desc);}\r
-void image_mixer::begin_layer(){impl_->begin_layer();}\r
+boost::unique_future<safe_ptr<host_buffer>> image_mixer::render(){return impl_->render();}\r
+safe_ptr<write_frame> image_mixer::create_frame(const void* tag, const core::pixel_format_desc& desc){return impl_->create_frame(tag, desc);}\r
+void image_mixer::begin_layer(blend_mode::type blend_mode){impl_->begin_layer(blend_mode);}\r
void image_mixer::end_layer(){impl_->end_layer();}\r
image_mixer& image_mixer::operator=(image_mixer&& other)\r
{\r