X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=core%2Fmixer%2Fimage%2Fimage_kernel.cpp;h=1fd83d91d5d8b0b0efd6a32cd21f8c4adaa70c80;hb=116e09a218cf056e4de868454b0fe26dc4db1413;hp=0ca341aa8e2bd70148474b947736f48c784d09eb;hpb=0c70e709c449ebad9ac295aa88332137a810aa7e;p=casparcg diff --git a/core/mixer/image/image_kernel.cpp b/core/mixer/image/image_kernel.cpp index 0ca341aa8..1fd83d91d 100644 --- a/core/mixer/image/image_kernel.cpp +++ b/core/mixer/image/image_kernel.cpp @@ -21,16 +21,20 @@ #include "image_kernel.h" +#include "image_shader.h" + #include "blending_glsl.h" #include "../gpu/shader.h" #include "../gpu/device_buffer.h" +#include "../gpu/ogl_device.h" #include #include +#include #include #include -#include +#include #include @@ -54,368 +58,151 @@ GLubyte lower_pattern[] = { struct image_kernel::implementation : boost::noncopyable { - std::unique_ptr shader_; - - core::video_mode::type last_mode_; - size_t last_width_; - size_t last_height_; - - //std::string get_blend_color_func() - //{ - // return - // - // get_blend_glsl() - // - // + - // - // "vec3 get_blend_color(vec3 back, vec3 fore) \n" - // "{ \n" - // " switch(blend_mode) \n" - // " { \n" - // " case 0: return BlendNormal(back, fore); \n" - // " case 1: return BlendLighten(back, fore); \n" - // " case 2: return BlendDarken(back, fore); \n" - // " case 3: return BlendMultiply(back, fore); \n" - // " case 4: return BlendAverage(back, fore); \n" - // " case 5: return BlendAdd(back, fore); \n" - // " case 6: return BlendSubstract(back, fore); \n" - // " case 7: return BlendDifference(back, fore); \n" - // " case 8: return BlendNegation(back, fore); \n" - // " case 9: return BlendExclusion(back, fore); \n" - // " case 10: return BlendScreen(back, fore); \n" - // " case 11: return BlendOverlay(back, fore); \n" - // //" case 12: return BlendSoftLight(back, fore); \n" - // " case 13: return BlendHardLight(back, fore); \n" - // " case 14: return BlendColorDodge(back, fore); \n" - // " case 15: return BlendColorBurn(back, fore); \n" - // " case 16: return BlendLinearDodge(back, fore); \n" - // " case 17: return BlendLinearBurn(back, fore); \n" - // " case 18: return BlendLinearLight(back, fore); \n" - // " case 19: return BlendVividLight(back, fore); \n" - // " case 20: return BlendPinLight(back, fore); \n" - // " case 21: return BlendHardMix(back, fore); \n" - // " case 22: return BlendReflect(back, fore); \n" - // " case 23: return BlendGlow(back, fore); \n" - // " case 24: return BlendPhoenix(back, fore); \n" - // " case 25: return BlendHue(back, fore); \n" - // " case 26: return BlendSaturation(back, fore); \n" - // " case 27: return BlendColor(back, fore); \n" - // " case 28: return BlendLuminosity(back, fore); \n" - // " } \n" - // " return BlendNormal(back, fore); \n" - // "} \n" - // " \n" - // "vec4 blend_color(vec4 fore) \n" - // "{ \n" - // " vec4 back = texture2D(background, gl_TexCoord[1].st); \n" - // " if(levels) \n" - // " fore.rgb = LevelsControl(fore.rgb, min_input, max_input, gamma, min_output, max_output); \n" - // " if(csb) \n" - // " fore.rgb = ContrastSaturationBrightness(fore.rgb, brt, sat, con); \n" - // " fore.rgb = get_blend_color(back.bgr, fore.rgb); \n" - // " \n" - // " return vec4(mix(back.rgb, fore.rgb, fore.a), back.a + fore.a); \n" - // "} \n"; - //} - // - //std::string get_simple_blend_color_func() - //{ - // return - - // "vec4 blend_color(vec4 fore) \n" - // "{ \n" - // " vec4 back = texture2D(background, gl_TexCoord[1].st); \n" - // " return vec4(mix(back.rgb, fore.rgb, fore.a), back.a + fore.a); \n" - // "} \n"; - //} - - std::string get_vertex() - { - return - - "void main() \n" - "{ \n" - " gl_TexCoord[0] = gl_MultiTexCoord0; \n" - " gl_TexCoord[1] = gl_MultiTexCoord1; \n" - " gl_FrontColor = gl_Color; \n" - " gl_Position = ftransform(); \n" - "} \n"; - } - - std::string get_fragment(bool compability_mode) - { - return - - "#version 120 \n" - "uniform sampler2D background; \n" - "uniform sampler2D plane[4]; \n" - "uniform sampler2D local_key; \n" - "uniform sampler2D layer_key; \n" - " \n" - "uniform bool is_hd; \n" - "uniform bool has_local_key; \n" - "uniform bool has_layer_key; \n" - "uniform int blend_mode; \n" - "uniform int alpha_mode; \n" - "uniform int pixel_format; \n" - " \n" - "uniform bool levels; \n" - "uniform float min_input; \n" - "uniform float max_input; \n" - "uniform float gamma; \n" - "uniform float min_output; \n" - "uniform float max_output; \n" - " \n" - "uniform bool csb; \n" - "uniform float brt; \n" - "uniform float sat; \n" - "uniform float con; \n" - " \n" - "//http://slouken.blogspot.com/2011/02/mpeg-acceleration-with-glsl.html \n" - "vec4 ycbcra_to_rgba_sd(float y, float cb, float cr, float a) \n" - "{ \n" - " // YUV offset \n" - " const vec3 offset = vec3(-0.0625, -0.5, -0.5); \n" - " \n" - " // RGB coefficients \n" - " const vec3 Rcoeff = vec3(1.164, 0.000, 1.596); \n" - " const vec3 Gcoeff = vec3(1.164, -0.391, -0.813); \n" - " const vec3 Bcoeff = vec3(1.164, 2.018, 0.000); \n" - " \n" - " vec3 yuv = vec3(y, cr, cb); \n" - " vec4 rgba; \n" - " \n" - " yuv += offset; \n" - " rgba.r = dot(yuv, Rcoeff); \n" - " rgba.g = dot(yuv, Gcoeff); \n" - " rgba.b = dot(yuv, Bcoeff); \n" - " rgba.a = a; \n" - " \n" - " return rgba; \n" - "} \n" - " \n" - "vec4 ycbcra_to_rgba_hd(float y, float cb, float cr, float a) \n" - "{ \n" - " // YUV offset \n" - " const vec3 offset = vec3(-0.0625, -0.5, -0.5); \n" - " \n" - " // RGB coefficients \n" - " const vec3 Rcoeff = vec3(1.164, 0.000, 1.793); \n" - " const vec3 Gcoeff = vec3(1.164, -0.213, -0.534); \n" - " const vec3 Bcoeff = vec3(1.164, 2.115, 0.000); \n" - " \n" - " vec3 yuv = vec3(y, cr, cb); \n" - " vec4 rgba; \n" - " \n" - " yuv += offset; \n" - " rgba.r = dot(yuv, Rcoeff); \n" - " rgba.g = dot(yuv, Gcoeff); \n" - " rgba.b = dot(yuv, Bcoeff); \n" - " rgba.a = a; \n" - " \n" - " return rgba; \n" - "} \n" - " \n" - "vec4 ycbcra_to_rgba(float y, float cb, float cr, float a) \n" - "{ \n" - " if(is_hd) \n" - " return ycbcra_to_rgba_hd(y, cb, cr, a); \n" - " else \n" - " return ycbcra_to_rgba_sd(y, cb, cr, a); \n" - "} \n" - " \n" - "vec4 get_rgba_color() \n" - "{ \n" - " switch(pixel_format) \n" - " { \n" - " case 0: //gray \n" - " return vec4(texture2D(plane[0], gl_TexCoord[0].st).rrr, 1.0); \n" - " case 1: //bgra, \n" - " return texture2D(plane[0], gl_TexCoord[0].st).bgra; \n" - " case 2: //rgba, \n" - " return texture2D(plane[0], gl_TexCoord[0].st).rgba; \n" - " case 3: //argb, \n" - " return texture2D(plane[0], gl_TexCoord[0].st).argb; \n" - " case 4: //abgr, \n" - " return texture2D(plane[0], gl_TexCoord[0].st).gbar; \n" - " case 5: //ycbcr, \n" - " { \n" - " float y = texture2D(plane[0], gl_TexCoord[0].st).r; \n" - " float cb = texture2D(plane[1], gl_TexCoord[0].st).r; \n" - " float cr = texture2D(plane[2], gl_TexCoord[0].st).r; \n" - " return ycbcra_to_rgba(y, cb, cr, 1.0); \n" - " } \n" - " case 6: //ycbcra \n" - " { \n" - " float y = texture2D(plane[0], gl_TexCoord[0].st).r; \n" - " float cb = texture2D(plane[1], gl_TexCoord[0].st).r; \n" - " float cr = texture2D(plane[2], gl_TexCoord[0].st).r; \n" - " float a = texture2D(plane[3], gl_TexCoord[0].st).r; \n" - " return ycbcra_to_rgba(y, cb, cr, a); \n" - " } \n" - " case 7: //luma \n" - " { \n" - " vec3 y3 = texture2D(plane[0], gl_TexCoord[0].st).rrr; \n" - " return vec4((y3-0.065)/0.859, 1.0); \n" - " } \n" - " } \n" - " return vec4(0.0, 0.0, 0.0, 0.0); \n" - "} \n" - " \n" - "void main() \n" - "{ \n" - " vec4 color = get_rgba_color(); \n" - " if(has_local_key) \n" - " color.a *= texture2D(local_key, gl_TexCoord[1].st).r; \n" - " if(has_layer_key) \n" - " color.a *= texture2D(layer_key, gl_TexCoord[1].st).r; \n" - " gl_FragColor = color.bgra * gl_Color; \n" - "} \n"; - } - - - implementation() - : last_mode_(core::video_mode::progressive) - , last_width_(0) - , last_height_(0) - { - } - - - void draw(const render_item& item, - const safe_ptr& background, - const std::shared_ptr& local_key, - const std::shared_ptr& layer_key) + std::shared_ptr shader_; + bool blend_modes_; + + void draw(ogl_device& ogl, draw_params&& params) { static const double epsilon = 0.001; - CASPAR_ASSERT(item.pix_desc.planes.size() == item.textures.size()); + CASPAR_ASSERT(params.pix_desc.planes.size() == params.textures.size()); - if(item.textures.empty()) + if(params.textures.empty() || !params.background) return; - if(item.transform.get_opacity() < epsilon) + if(params.transform.opacity < epsilon) return; - - if(!shader_) + + if(!std::all_of(params.textures.begin(), params.textures.end(), std::mem_fn(&device_buffer::ready))) { - try - { - shader_.reset(new shader(get_vertex(), get_fragment(false))); - } - catch(...) - { - CASPAR_LOG_CURRENT_EXCEPTION(); - CASPAR_LOG(warning) << "Failed to compile shader. Trying to compile without blend-modes."; - shader_.reset(new shader(get_vertex(), get_fragment(true))); - } + CASPAR_LOG(warning) << L"[image_mixer] Performance warning. Host to device transfer not complete, GPU will be stalled"; + ogl.yield(); // Try to give it some more time. + } + + // Bind textures + + for(size_t n = 0; n < params.textures.size(); ++n) + params.textures[n]->bind(n); + + if(params.local_key) + params.local_key->bind(texture_id::local_key); + + if(params.layer_key) + params.layer_key->bind(texture_id::layer_key); - GL(glEnable(GL_BLEND)); - GL(glBlendFuncSeparate(GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_ONE, GL_ONE)); + // Setup shader - GL(glEnable(GL_TEXTURE_2D)); - } + if(!shader_) + shader_ = get_image_shader(ogl, blend_modes_); + + ogl.use(*shader_); + + shader_->set("plane[0]", texture_id::plane0); + shader_->set("plane[1]", texture_id::plane1); + shader_->set("plane[2]", texture_id::plane2); + shader_->set("plane[3]", texture_id::plane3); + shader_->set("local_key", texture_id::local_key); + shader_->set("layer_key", texture_id::layer_key); + shader_->set("is_hd", params.pix_desc.planes.at(0).height > 700 ? 1 : 0); + shader_->set("has_local_key", params.local_key); + shader_->set("has_layer_key", params.layer_key); + shader_->set("pixel_format", params.pix_desc.pix_fmt); + shader_->set("opacity", params.transform.is_key ? 1.0 : params.transform.opacity); + + // Setup blend_func + + if(params.transform.is_key) + params.blend_mode = blend_mode::normal; - if(last_mode_ != item.mode) + if(blend_modes_) { - last_mode_ = item.mode; - - if(item.mode == core::video_mode::progressive) - GL(glDisable(GL_POLYGON_STIPPLE)); - else - { - GL(glEnable(GL_POLYGON_STIPPLE)); + params.background->bind(6); - if(item.mode == core::video_mode::upper) - glPolygonStipple(upper_pattern); - else if(item.mode == core::video_mode::lower) - glPolygonStipple(lower_pattern); - } + shader_->set("background", texture_id::background); + shader_->set("blend_mode", params.blend_mode); } - - if(last_width_ != background->width() || last_height_ != background->height()) + else { - last_width_ = background->width(); - last_height_ = background->height(); - GL(glViewport(0, 0, background->width(), background->height())); + switch(params.blend_mode) + { + case blend_mode::mix: + ogl.blend_func(GL_ONE, GL_ONE); + break; + default: + ogl.blend_func(GL_ONE, GL_ONE_MINUS_SRC_ALPHA); + } } - // Bind textures - - for(size_t n = 0; n < item.textures.size(); ++n) - item.textures[n]->bind(n); - - if(local_key) - local_key->bind(4); + // Setup image-adjustements - if(layer_key) - layer_key->bind(5); - - background->bind(6); - - // Setup shader - - shader_->use(); - - shader_->set("plane[0]", 0); - shader_->set("plane[1]", 1); - shader_->set("plane[2]", 2); - shader_->set("plane[3]", 3); - shader_->set("local_key", 4); - shader_->set("layer_key", 5); - shader_->set("background", 6); - shader_->set("is_hd", item.pix_desc.planes.at(0).height > 700 ? 1 : 0); - shader_->set("has_local_key", local_key ? 1 : 0); - shader_->set("has_layer_key", layer_key ? 1 : 0); - shader_->set("blend_mode", item.transform.get_is_key() ? core::image_transform::blend_mode::normal : item.transform.get_blend_mode()); - shader_->set("alpha_mode", item.transform.get_alpha_mode()); - shader_->set("pixel_format", item.pix_desc.pix_fmt); - - auto levels = item.transform.get_levels(); - - if(levels.min_input > epsilon || - levels.max_input < 1.0-epsilon || - levels.min_output > epsilon || - levels.max_output < 1.0-epsilon || - std::abs(levels.gamma - 1.0) > epsilon) + if(params.transform.levels.min_input > epsilon || + params.transform.levels.max_input < 1.0-epsilon || + params.transform.levels.min_output > epsilon || + params.transform.levels.max_output < 1.0-epsilon || + std::abs(params.transform.levels.gamma - 1.0) > epsilon) { shader_->set("levels", true); - shader_->set("min_input", levels.min_input); - shader_->set("max_input", levels.max_input); - shader_->set("min_output", levels.min_output); - shader_->set("max_output", levels.max_output); - shader_->set("gamma", levels.gamma); + shader_->set("min_input", params.transform.levels.min_input); + shader_->set("max_input", params.transform.levels.max_input); + shader_->set("min_output", params.transform.levels.min_output); + shader_->set("max_output", params.transform.levels.max_output); + shader_->set("gamma", params.transform.levels.gamma); } else shader_->set("levels", false); - if(std::abs(item.transform.get_brightness() - 1.0) > epsilon || - std::abs(item.transform.get_saturation() - 1.0) > epsilon || - std::abs(item.transform.get_contrast() - 1.0) > epsilon) + if(std::abs(params.transform.brightness - 1.0) > epsilon || + std::abs(params.transform.saturation - 1.0) > epsilon || + std::abs(params.transform.contrast - 1.0) > epsilon) { shader_->set("csb", true); - shader_->set("brt", item.transform.get_brightness()); - shader_->set("sat", item.transform.get_saturation()); - shader_->set("con", item.transform.get_contrast()); + shader_->set("brt", params.transform.brightness); + shader_->set("sat", params.transform.saturation); + shader_->set("con", params.transform.contrast); } else shader_->set("csb", false); + // Setup interlacing + + if(params.transform.field_mode == core::field_mode::progressive) + ogl.disable(GL_POLYGON_STIPPLE); + else + { + ogl.enable(GL_POLYGON_STIPPLE); + + if(params.transform.field_mode == core::field_mode::upper) + ogl.stipple_pattern(upper_pattern); + else if(params.transform.field_mode == core::field_mode::lower) + ogl.stipple_pattern(lower_pattern); + } + // Setup drawing area + + ogl.viewport(0, 0, params.background->width(), params.background->height()); + + auto m_p = params.transform.clip_translation; + auto m_s = params.transform.clip_scale; - GL(glColor4d(item.transform.get_gain(), item.transform.get_gain(), item.transform.get_gain(), item.transform.get_opacity())); - - auto m_p = item.transform.get_clip_translation(); - auto m_s = item.transform.get_clip_scale(); - double w = static_cast(background->width()); - double h = static_cast(background->height()); + bool scissor = m_p[0] > std::numeric_limits::epsilon() || m_p[1] > std::numeric_limits::epsilon() || + m_s[0] < (1.0 - std::numeric_limits::epsilon()) || m_s[1] < (1.0 - std::numeric_limits::epsilon()); - GL(glEnable(GL_SCISSOR_TEST)); - GL(glScissor(static_cast(m_p[0]*w), static_cast(m_p[1]*h), static_cast(m_s[0]*w), static_cast(m_s[1]*h))); - - auto f_p = item.transform.get_fill_translation(); - auto f_s = item.transform.get_fill_scale(); + if(scissor) + { + double w = static_cast(params.background->width()); + double h = static_cast(params.background->height()); + + ogl.enable(GL_SCISSOR_TEST); + ogl.scissor(static_cast(m_p[0]*w), static_cast(m_p[1]*h), static_cast(m_s[0]*w), static_cast(m_s[1]*h)); + } + + auto f_p = params.transform.fill_translation; + auto f_s = params.transform.fill_scale; + + // Set render target + + ogl.attach(*params.background); // Draw @@ -426,19 +213,26 @@ struct image_kernel::implementation : boost::noncopyable glMultiTexCoord2d(GL_TEXTURE0, 0.0, 1.0); glMultiTexCoord2d(GL_TEXTURE1, f_p[0] , (f_p[1]+f_s[1])); glVertex2d( f_p[0] *2.0-1.0, (f_p[1]+f_s[1])*2.0-1.0); glEnd(); - GL(glDisable(GL_SCISSOR_TEST)); + // Cleanup + + ogl.disable(GL_SCISSOR_TEST); + + params.textures.clear(); + ogl.yield(); // Return resources to pool as early as possible. + + if(blend_modes_) + { + // http://www.opengl.org/registry/specs/NV/texture_barrier.txt + // This allows us to use framebuffer (background) both as source and target while blending. + glTextureBarrierNV(); + } } }; image_kernel::image_kernel() : impl_(new implementation()){} -void image_kernel::draw(const render_item& item, const safe_ptr& background, const std::shared_ptr& local_key, const std::shared_ptr& layer_key) -{ - impl_->draw(item, background, local_key, layer_key); -} - -bool operator==(const render_item& lhs, const render_item& rhs) +void image_kernel::draw(ogl_device& ogl, draw_params&& params) { - return lhs.textures == rhs.textures && lhs.transform == rhs.transform && lhs.tag == rhs.tag && lhs.mode == rhs.mode; + impl_->draw(ogl, std::move(params)); } }} \ No newline at end of file