]> git.sesse.net Git - casparcg/blobdiff - core/mixer/image/image_mixer.cpp
2.0. image_mixer: Refactored and reduced memory usage.
[casparcg] / core / mixer / image / image_mixer.cpp
index 4b531ecf1e39242cb784be6c0b4b67c34a3583ce..ae8fec69ddf1bee20f56f712b42ce0434cba160a 100644 (file)
@@ -25,7 +25,9 @@
 #include "../gpu/ogl_device.h"\r
 #include "../gpu/host_buffer.h"\r
 #include "../gpu/device_buffer.h"\r
-#include "../gpu/gpu_write_frame.h"\r
+#include "../write_frame.h"\r
+\r
+#include "../../video_channel_context.h"\r
 \r
 #include <common/concurrency/executor.h>\r
 #include <common/exception/exceptions.h>\r
 #include <core/producer/frame/pixel_format.h>\r
 #include <core/video_format.h>\r
 \r
-#include <boost/foreach.hpp>\r
+#include <gl/glew.h>\r
 \r
-#include <Glee.h>\r
-#include <SFML/Window/Context.hpp>\r
+#include <boost/foreach.hpp>\r
+#include <boost/range.hpp>\r
+#include <boost/range/algorithm/find.hpp>\r
 \r
+#include <algorithm>\r
 #include <array>\r
+#include <deque>\r
 #include <unordered_map>\r
 \r
-namespace caspar { namespace mixer {\r
+namespace caspar { namespace core {\r
                \r
 struct image_mixer::implementation : boost::noncopyable\r
-{                      \r
-       const core::video_format_desc format_desc_;\r
-       \r
-       std::stack<core::image_transform> transform_stack_;\r
-\r
-       GLuint fbo_;\r
-       std::array<std::shared_ptr<device_buffer>, 2> render_targets_;\r
-       std::shared_ptr<device_buffer> key_target_;\r
-       bool is_key_;\r
+{              \r
+       typedef std::deque<render_item>                 layer;\r
 \r
-       std::shared_ptr<host_buffer> reading_;\r
+       video_channel_context&                                  channel_;\r
 \r
-       image_kernel kernel_;\r
+       std::vector<image_transform>                    transform_stack_;\r
+       std::vector<video_mode::type>                   mode_stack_;\r
 \r
-       struct render_item\r
-       {\r
-               core::pixel_format_desc desc;\r
-               std::vector<safe_ptr<device_buffer>> textures;\r
-               core::image_transform transform;\r
-       };\r
+       std::deque<std::deque<render_item>>             layers_; // layer/stream/items\r
        \r
-       std::vector<render_item> waiting_queue_;\r
-       std::vector<render_item> render_queue_;\r
+       image_kernel                                                    kernel_;\r
+               \r
+       std::shared_ptr<device_buffer>                  draw_buffer_;\r
 \r
+       std::shared_ptr<device_buffer>                  local_key_buffer_;\r
+       std::shared_ptr<device_buffer>                  layer_key_buffer_;\r
+               \r
 public:\r
-       implementation(const core::video_format_desc& format_desc) \r
-               : format_desc_(format_desc)\r
-               , is_key_(false)\r
+       implementation(video_channel_context& video_channel) \r
+               : channel_(video_channel)\r
+               , transform_stack_(1)\r
+               , mode_stack_(1, video_mode::progressive)\r
        {\r
-               ogl_device::invoke([]\r
-               {\r
-                       if(!GLEE_VERSION_3_0)\r
-                               BOOST_THROW_EXCEPTION(not_supported() << msg_info("Missing OpenGL 3.0 support."));\r
-               });\r
-               \r
-               ogl_device::begin_invoke([=]\r
-               {\r
-                       transform_stack_.push(core::image_transform());\r
-                       transform_stack_.top().set_mode(core::video_mode::progressive);\r
-\r
-                       GL(glEnable(GL_TEXTURE_2D));\r
-                       GL(glDisable(GL_DEPTH_TEST));           \r
-                       \r
-                       key_target_ = ogl_device::create_device_buffer(format_desc.width, format_desc.height, 4);\r
-                       render_targets_[0] = ogl_device::create_device_buffer(format_desc.width, format_desc.height, 4);\r
-                       render_targets_[1] = ogl_device::create_device_buffer(format_desc.width, format_desc.height, 4);\r
-                       \r
-                       GL(glGenFramebuffers(1, &fbo_));                \r
-                       GL(glBindFramebuffer(GL_FRAMEBUFFER_EXT, fbo_));\r
-                       GL(glReadBuffer(GL_COLOR_ATTACHMENT0_EXT));\r
-\r
-                       reading_ = ogl_device::create_host_buffer(format_desc_.size, host_buffer::read_only);\r
-               });\r
        }\r
 \r
        ~implementation()\r
        {\r
-               glDeleteFramebuffersEXT(1, &fbo_);\r
+               channel_.ogl().gc();\r
        }\r
-\r
-       void begin(const core::basic_frame& frame)\r
+       \r
+       void begin(core::basic_frame& frame)\r
        {\r
-               transform_stack_.push(transform_stack_.top()*frame.get_image_transform());\r
+               transform_stack_.push_back(transform_stack_.back()*frame.get_image_transform());\r
+               mode_stack_.push_back(frame.get_mode() == video_mode::progressive ? mode_stack_.back() : frame.get_mode());\r
        }\r
                \r
        void visit(core::write_frame& frame)\r
-       {               \r
-               auto gpu_frame = dynamic_cast<gpu_write_frame*>(&frame);\r
-               if(!gpu_frame)\r
+       {       \r
+               CASPAR_ASSERT(!layers_.empty());\r
+\r
+               // Check if frame has been discarded by interlacing\r
+               if(boost::range::find(mode_stack_, video_mode::upper) != mode_stack_.end() && boost::range::find(mode_stack_, video_mode::lower) != mode_stack_.end())\r
                        return;\r
                \r
-               auto desc = gpu_frame->get_pixel_format_desc();\r
-               auto buffers = gpu_frame->get_plane_buffers();\r
-               auto transform = transform_stack_.top();\r
+               core::render_item item(frame.get_pixel_format_desc(), frame.get_textures(), transform_stack_.back(), mode_stack_.back(), frame.tag());  \r
 \r
-               ogl_device::begin_invoke([=]\r
-               {\r
-                       render_item item;\r
-\r
-                       item.desc = desc;\r
-                       item.transform = transform;\r
-                       \r
-                       for(size_t n = 0; n < buffers.size(); ++n)\r
-                       {\r
-                               GL(glActiveTexture(GL_TEXTURE0+n));\r
-                               auto texture = ogl_device::create_device_buffer(desc.planes[n].width, desc.planes[n].height, desc.planes[n].channels);\r
-                               texture->read(*buffers[n]);\r
-                               item.textures.push_back(texture);\r
-                       }       \r
+               auto& layer = layers_.back();\r
 \r
-                       waiting_queue_.push_back(item);\r
-               });\r
+               if(boost::range::find(layer, item) == layer.end())\r
+                       layer.push_back(item);\r
        }\r
 \r
        void end()\r
        {\r
-               transform_stack_.pop();\r
+               transform_stack_.pop_back();\r
+               mode_stack_.pop_back();\r
        }\r
 \r
-       boost::unique_future<safe_ptr<const host_buffer>> render()\r
+       void begin_layer()\r
        {\r
-               auto result = ogl_device::begin_invoke([=]() -> safe_ptr<const host_buffer>\r
-               {\r
-                       reading_->map(); // Might block.\r
-                       return make_safe(reading_);\r
-               });\r
-                       \r
-               ogl_device::begin_invoke([=]\r
-               {\r
-                       is_key_ = false;\r
-\r
-                       // Clear and bind frame-buffers.\r
-\r
-                       key_target_->attach();\r
-                       GL(glClear(GL_COLOR_BUFFER_BIT));       \r
-\r
-                       render_targets_[0]->attach();\r
-                       GL(glClear(GL_COLOR_BUFFER_BIT));\r
-\r
-                       // Render items.\r
-\r
-                       BOOST_FOREACH(auto item, render_queue_)\r
-                               render(item);                   \r
-\r
-                       // Move waiting items to queue.\r
-\r
-                       render_queue_ = std::move(waiting_queue_);\r
-\r
-                       // Start read-back.\r
-\r
-                       reading_ = ogl_device::create_host_buffer(format_desc_.size, host_buffer::read_only);\r
-                       render_targets_[0]->attach();\r
-                       render_targets_[0]->write(*reading_);\r
-                       std::swap(render_targets_[0], render_targets_[1]);\r
-               });\r
-\r
-               return std::move(result);\r
+               layers_.push_back(layer());\r
        }\r
 \r
-       void render(const render_item& item)\r
+       void end_layer()\r
+       {\r
+       }\r
+       \r
+       boost::unique_future<safe_ptr<host_buffer>> render()\r
        {               \r
-               const auto desc          = item.desc;\r
-               auto       textures      = item.textures;\r
-               const auto transform = item.transform;\r
-                               \r
-               // Bind textures\r
-\r
-               for(size_t n = 0; n < textures.size(); ++n)\r
+               auto layers = std::move(layers_);\r
+               return channel_.ogl().begin_invoke([=]()mutable\r
                {\r
-                       GL(glActiveTexture(GL_TEXTURE0+n));\r
-                       textures[n]->bind();\r
-               }               \r
+                       return render(std::move(layers));\r
+               });\r
+       }\r
+       \r
+       safe_ptr<host_buffer> render(std::deque<layer>&& layers)\r
+       {\r
+               draw_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 4);                             \r
+               channel_.ogl().clear(*draw_buffer_);\r
+                               \r
+               BOOST_FOREACH(auto& layer, layers)\r
+                       draw(std::move(layer));\r
+                               \r
+               auto host_buffer = channel_.ogl().create_host_buffer(channel_.get_format_desc().size, host_buffer::read_only);\r
+               channel_.ogl().attach(*draw_buffer_);\r
+               host_buffer->begin_read(draw_buffer_->width(), draw_buffer_->height(), format(draw_buffer_->stride()));\r
+               \r
+               GL(glFlush());\r
+               \r
+               return host_buffer;\r
+       }\r
 \r
-               // Setup key and kernel\r
+       void draw(layer&& layer)\r
+       {                                       \r
+               BOOST_FOREACH(auto& item, layer)\r
+                       draw(std::move(item));\r
+               \r
+               std::swap(local_key_buffer_, layer_key_buffer_);\r
+       }\r
 \r
-               if(transform.get_is_key())\r
+       void draw(render_item&& item)\r
+       {                                                                                       \r
+               if(item.transform.get_is_key())\r
                {\r
-                       kernel_.apply(desc, transform, false);\r
-                       if(!is_key_)\r
+                       if(!local_key_buffer_)\r
                        {\r
-                               key_target_->attach();\r
-                               is_key_ = true;\r
-                               GL(glClear(GL_COLOR_BUFFER_BIT));               \r
+                               local_key_buffer_ = channel_.ogl().create_device_buffer(channel_.get_format_desc().width, channel_.get_format_desc().height, 1);\r
+                               channel_.ogl().clear(*local_key_buffer_);\r
                        }\r
-               }               \r
-               else\r
-               {                                               \r
-                       kernel_.apply(desc, transform, is_key_);        \r
-                       if(is_key_)\r
-                       {\r
-                               is_key_ = false;\r
 \r
-                               render_targets_[0]->attach();                   \r
-                               GL(glActiveTexture(GL_TEXTURE0+3));\r
-                               key_target_->bind();\r
-                       }       \r
+                       draw(local_key_buffer_, std::move(item), nullptr, nullptr);\r
+               }\r
+               else\r
+               {\r
+                       draw(draw_buffer_, std::move(item), local_key_buffer_, layer_key_buffer_);      \r
+                       local_key_buffer_.reset();\r
+               }\r
+       }\r
+       \r
+       void draw(std::shared_ptr<device_buffer>& target, render_item&& item, const std::shared_ptr<device_buffer>& local_key, const std::shared_ptr<device_buffer>& layer_key)\r
+       {\r
+               if(!std::all_of(item.textures.begin(), item.textures.end(), std::mem_fn(&device_buffer::ready)))\r
+               {\r
+                       CASPAR_LOG(warning) << L"[image_mixer] Performance warning. Host to device transfer not complete, GPU will be stalled";\r
+                       channel_.ogl().yield(); // Try to give it some more time.\r
                }               \r
 \r
-               GL(glColor4d(1.0, 1.0, 1.0, transform.get_opacity()));\r
-               GL(glViewport(0, 0, format_desc_.width, format_desc_.height));\r
-                                               \r
-               auto m_p = transform.get_key_translation();\r
-               auto m_s = transform.get_key_scale();\r
-               double w = static_cast<double>(format_desc_.width);\r
-               double h = static_cast<double>(format_desc_.height);\r
-\r
-               GL(glEnable(GL_SCISSOR_TEST));\r
-               GL(glScissor(static_cast<size_t>(m_p[0]*w), static_cast<size_t>(m_p[1]*h), static_cast<size_t>(m_s[0]*w), static_cast<size_t>(m_s[1]*h)));\r
-                       \r
-               auto f_p = transform.get_fill_translation();\r
-               auto f_s = transform.get_fill_scale();\r
-                       \r
-               glBegin(GL_QUADS);\r
-                       glMultiTexCoord2d(GL_TEXTURE0, 0.0, 0.0); glMultiTexCoord2d(GL_TEXTURE1,  f_p[0]        ,  f_p[1]        );             glVertex2d( f_p[0]        *2.0-1.0,  f_p[1]        *2.0-1.0);\r
-                       glMultiTexCoord2d(GL_TEXTURE0, 1.0, 0.0); glMultiTexCoord2d(GL_TEXTURE1, (f_p[0]+f_s[0]),  f_p[1]        );             glVertex2d((f_p[0]+f_s[0])*2.0-1.0,  f_p[1]        *2.0-1.0);\r
-                       glMultiTexCoord2d(GL_TEXTURE0, 1.0, 1.0); glMultiTexCoord2d(GL_TEXTURE1, (f_p[0]+f_s[0]), (f_p[1]+f_s[1]));             glVertex2d((f_p[0]+f_s[0])*2.0-1.0, (f_p[1]+f_s[1])*2.0-1.0);\r
-                       glMultiTexCoord2d(GL_TEXTURE0, 0.0, 1.0); glMultiTexCoord2d(GL_TEXTURE1,  f_p[0]        , (f_p[1]+f_s[1]));             glVertex2d( f_p[0]        *2.0-1.0, (f_p[1]+f_s[1])*2.0-1.0);\r
-               glEnd();\r
-               GL(glDisable(GL_SCISSOR_TEST));         \r
+               kernel_.draw(channel_.ogl(), std::move(item), make_safe(target), local_key, layer_key);\r
        }\r
-                       \r
-       std::vector<safe_ptr<host_buffer>> create_buffers(const core::pixel_format_desc& format)\r
+                               \r
+       safe_ptr<write_frame> create_frame(const void* tag, const core::pixel_format_desc& desc)\r
        {\r
-               std::vector<safe_ptr<host_buffer>> buffers;\r
-               std::transform(format.planes.begin(), format.planes.end(), std::back_inserter(buffers), [&](const core::pixel_format_desc::plane& plane)\r
-               {\r
-                       return ogl_device::create_host_buffer(plane.size, host_buffer::write_only);\r
-               });\r
-               return buffers;\r
+               return make_safe<write_frame>(channel_.ogl(), tag, desc);\r
        }\r
 };\r
 \r
-image_mixer::image_mixer(const core::video_format_desc& format_desc) : impl_(new implementation(format_desc)){}\r
-void image_mixer::begin(const core::basic_frame& frame){impl_->begin(frame);}\r
+image_mixer::image_mixer(video_channel_context& video_channel) : impl_(new implementation(video_channel)){}\r
+void image_mixer::begin(core::basic_frame& frame){impl_->begin(frame);}\r
 void image_mixer::visit(core::write_frame& frame){impl_->visit(frame);}\r
 void image_mixer::end(){impl_->end();}\r
-boost::unique_future<safe_ptr<const host_buffer>> image_mixer::render(){return impl_->render();}\r
-std::vector<safe_ptr<host_buffer>> image_mixer::create_buffers(const core::pixel_format_desc& format){return impl_->create_buffers(format);}\r
+boost::unique_future<safe_ptr<host_buffer>> image_mixer::render(){return impl_->render();}\r
+safe_ptr<write_frame> image_mixer::create_frame(const void* tag, const core::pixel_format_desc& desc){return impl_->create_frame(tag, desc);}\r
+void image_mixer::begin_layer(){impl_->begin_layer();}\r
+void image_mixer::end_layer(){impl_->end_layer();}\r
+image_mixer& image_mixer::operator=(image_mixer&& other)\r
+{\r
+       impl_ = std::move(other.impl_);\r
+       return *this;\r
+}\r
 \r
 }}
\ No newline at end of file