Add support for Y'CbCr output.

author Steinar H. Gunderson <sgunderson@bigfoot.com>

Wed, 9 Sep 2015 21:51:48 +0000 (23:51 +0200)

committer Steinar H. Gunderson <sgunderson@bigfoot.com>

Wed, 9 Sep 2015 21:52:44 +0000 (23:52 +0200)
author Steinar H. Gunderson <sgunderson@bigfoot.com>
Wed, 9 Sep 2015 21:51:48 +0000 (23:51 +0200)
committer Steinar H. Gunderson <sgunderson@bigfoot.com>
Wed, 9 Sep 2015 21:52:44 +0000 (23:52 +0200)
diff --git a/.gitignore b/.gitignore

index 366d38c3b149bb0e45736b6acfaaccd3c01253c2..74045c5cdec3b8d2abb0eaa1eec8ffb80ece57dd 100644 (file)
--- a/.gitignore
+++ b/.gitignore
@@ -40,6 +40,7 @@ fp16_test
  luma_mix_effect_test
  slice_effect_test
  vignette_effect_test
+ycbcr_conversion_effect_test
  chain-*.frag
  movit.info
  coverage/
diff --git a/Makefile.in b/Makefile.in

index 35fc71ec0ab4e6c9a4a586e33ddb867f91fc6bc2..53eb6ffc1611a404a632cc6b68a3c9bd0c5f98eb 100644 (file)
--- a/Makefile.in
+++ b/Makefile.in
@@ -76,6 +76,7 @@ TESTED_EFFECTS += slice_effect
  TESTED_EFFECTS += complex_modulate_effect
  TESTED_EFFECTS += luma_mix_effect
  TESTED_EFFECTS += fft_convolution_effect
+TESTED_EFFECTS += ycbcr_conversion_effect
  
  UNTESTED_EFFECTS = sandbox_effect
  UNTESTED_EFFECTS += mirror_effect
diff --git a/effect_chain.cpp b/effect_chain.cpp

index 519cb2c6b9ea1c5816ead123b05260904519f96e..e1ae832e934a0deedb482b152e4a452f99f47b17 100644 (file)
--- a/effect_chain.cpp
+++ b/effect_chain.cpp
@@ -25,6 +25,7 @@
  #include "input.h"
  #include "resource_pool.h"
  #include "util.h"
+#include "ycbcr_conversion_effect.h"
  
  using namespace std;
  
@@ -74,6 +75,20 @@ void EffectChain::add_output(const ImageFormat &format, OutputAlphaFormat alpha_
         assert(!finalized);
         output_format = format;
         output_alpha_format = alpha_format;
+       output_color_type = OUTPUT_COLOR_RGB;
+}
+
+void EffectChain::add_ycbcr_output(const ImageFormat &format, OutputAlphaFormat alpha_format,
+                                   const YCbCrFormat &ycbcr_format)
+{
+       assert(!finalized);
+       output_format = format;
+       output_alpha_format = alpha_format;
+       output_color_type = OUTPUT_COLOR_YCBCR;
+       output_ycbcr_format = ycbcr_format;
+
+       assert(ycbcr_format.chroma_subsampling_x == 1);
+       assert(ycbcr_format.chroma_subsampling_y == 1);
  }
  
  Node *EffectChain::add_node(Effect *effect)
@@ -1363,6 +1378,22 @@ void EffectChain::fix_output_gamma()
                 connect_nodes(output, conversion);
         }
  }
+
+// If the user has requested Y'CbCr output, we need to do this conversion
+// _after_ GammaCompressionEffect etc., but before dither (see below).
+// This is because Y'CbCr, with the exception of a special optional mode
+// in Rec. 2020 (which we currently don't support), is defined to work on
+// gamma-encoded data.
+void EffectChain::add_ycbcr_conversion_if_needed()
+{
+       assert(output_color_type == OUTPUT_COLOR_RGB || output_color_type == OUTPUT_COLOR_YCBCR);
+       if (output_color_type != OUTPUT_COLOR_YCBCR) {
+               return;
+       }
+       Node *output = find_output_node();
+       Node *ycbcr = add_node(new YCbCrConversionEffect(output_ycbcr_format));
+       connect_nodes(output, ycbcr);
+}
         
  // If the user has requested dither, add a DitherEffect right at the end
  // (after GammaCompressionEffect etc.). This needs to be done after everything else,
@@ -1445,11 +1476,13 @@ void EffectChain::finalize()
         fix_internal_gamma_by_asking_inputs(15);
         fix_internal_gamma_by_inserting_nodes(16);
  
-       output_dot("step17-before-dither.dot");
+       output_dot("step17-before-ycbcr.dot");
+       add_ycbcr_conversion_if_needed();
  
+       output_dot("step18-before-dither.dot");
         add_dither_if_needed();
  
-       output_dot("step18-final.dot");
+       output_dot("step19-final.dot");
         
         // Construct all needed GLSL programs, starting at the output.
         // We need to keep track of which effects have already been computed,
@@ -1458,7 +1491,7 @@ void EffectChain::finalize()
         map<Node *, Phase *> completed_effects;
         construct_phase(find_output_node(), &completed_effects);
  
-       output_dot("step19-split-to-phases.dot");
+       output_dot("step20-split-to-phases.dot");
  
         assert(phases[0]->inputs.empty());
         
diff --git a/effect_chain.h b/effect_chain.h

index 2f088b607feeec92fd3bb98c69be5cafde2329dd..d1ab0a205148bd9d8a22e285a448d758a5fd7e00 100644 (file)
--- a/effect_chain.h
+++ b/effect_chain.h
@@ -29,6 +29,7 @@
  #include <vector>
  
  #include "image_format.h"
+#include "ycbcr.h"
  
  namespace movit {
  
@@ -162,8 +163,15 @@ public:
         }
         Effect *add_effect(Effect *effect, const std::vector<Effect *> &inputs);
  
+       // Adds an RGB output. Note that you can only have one output.
         void add_output(const ImageFormat &format, OutputAlphaFormat alpha_format);
  
+       // Adds an YCbCr output. Note that you can only have one output.
+       // Currently, only chunked packed output is supported, and only 4:4:4
+       // (so chroma_subsampling_x and chroma_subsampling_y must both be 1).
+       void add_ycbcr_output(const ImageFormat &format, OutputAlphaFormat alpha_format,
+                             const YCbCrFormat &ycbcr_format);
+
         // Set number of output bits, to scale the dither.
         // 8 is the right value for most outputs.
         // The default, 0, is a special value that means no dither.
@@ -303,12 +311,17 @@ private:
         void fix_internal_gamma_by_asking_inputs(unsigned step);
         void fix_internal_gamma_by_inserting_nodes(unsigned step);
         void fix_output_gamma();
+       void add_ycbcr_conversion_if_needed();
         void add_dither_if_needed();
  
         float aspect_nom, aspect_denom;
         ImageFormat output_format;
         OutputAlphaFormat output_alpha_format;
  
+       enum OutputColorType { OUTPUT_COLOR_RGB, OUTPUT_COLOR_YCBCR };
+       OutputColorType output_color_type;
+       YCbCrFormat output_ycbcr_format;  // If output_color_type == OUTPUT_COLOR_YCBCR.
+
         std::vector<Node *> nodes;
         std::map<Effect *, Node *> node_map;
         Effect *dither_effect;
diff --git a/test_util.cpp b/test_util.cpp

index a3ccb5c5f04cebcd3c804c294e95e93d7b886a59..2073bc2d6d3e31550dc6657c77d8664253203739 100644 (file)
--- a/test_util.cpp
+++ b/test_util.cpp
@@ -47,7 +47,7 @@ void vertical_flip(T *data, unsigned width, unsigned height)
  EffectChainTester::EffectChainTester(const float *data, unsigned width, unsigned height,
                                       MovitPixelFormat pixel_format, Colorspace color_space, GammaCurve gamma_curve,
                                       GLenum framebuffer_format)
-       : chain(width, height, get_static_pool()), width(width), height(height), finalized(false)
+       : chain(width, height, get_static_pool()), width(width), height(height), output_added(false), finalized(false)
  {
         CHECK(init_movit(".", MOVIT_DEBUG_OFF));
  
@@ -215,13 +215,28 @@ void EffectChainTester::run(unsigned char *out_data, GLenum format, Colorspace c
         vertical_flip(out_data, width, height);
  }
  
+void EffectChainTester::add_output(const ImageFormat &format, OutputAlphaFormat alpha_format)
+{
+       chain.add_output(format, alpha_format);
+       output_added = true;
+}
+
+void EffectChainTester::add_ycbcr_output(const ImageFormat &format, OutputAlphaFormat alpha_format, const YCbCrFormat &ycbcr_format)
+{
+       chain.add_ycbcr_output(format, alpha_format, ycbcr_format);
+       output_added = true;
+}
+
  void EffectChainTester::finalize_chain(Colorspace color_space, GammaCurve gamma_curve, OutputAlphaFormat alpha_format)
  {
         assert(!finalized);
-       ImageFormat image_format;
-       image_format.color_space = color_space;
-       image_format.gamma_curve = gamma_curve;
-       chain.add_output(image_format, alpha_format);
+       if (!output_added) {
+               ImageFormat image_format;
+               image_format.color_space = color_space;
+               image_format.gamma_curve = gamma_curve;
+               chain.add_output(image_format, alpha_format);
+               output_added = true;
+       }
         chain.finalize();
         finalized = true;
  }
diff --git a/test_util.h b/test_util.h

index e5e65513ddb82914758162080fabae40e039a7de..f413a39ca65251681b53c169d9e874da48988d2a 100644 (file)
--- a/test_util.h
+++ b/test_util.h
@@ -23,6 +23,8 @@ public:
         Input *add_input(const unsigned char *data, MovitPixelFormat pixel_format, Colorspace color_space, GammaCurve gamma_curve, int input_width = -1, int input_height = -1);
         void run(float *out_data, GLenum format, Colorspace color_space, GammaCurve gamma_curve, OutputAlphaFormat alpha_format = OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED);
         void run(unsigned char *out_data, GLenum format, Colorspace color_space, GammaCurve gamma_curve, OutputAlphaFormat alpha_format = OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED);
+       void add_output(const ImageFormat &format, OutputAlphaFormat alpha_format);
+       void add_ycbcr_output(const ImageFormat &format, OutputAlphaFormat alpha_format, const YCbCrFormat &ycbcr_format);
  
  private:
         void finalize_chain(Colorspace color_space, GammaCurve gamma_curve, OutputAlphaFormat alpha_format);
@@ -30,6 +32,7 @@ private:
         EffectChain chain;
         GLuint fbo, texnum;
         unsigned width, height;
+       bool output_added;
         bool finalized;
  };
  
diff --git a/ycbcr.h b/ycbcr.h

index 9179b1958a5cdcc73e1a5b74132a9b2bab45d3c8..4eb9e73185794fc0118ec2590e4303892dfa8595 100644 (file)
--- a/ycbcr.h
+++ b/ycbcr.h
@@ -1,7 +1,8 @@
  #ifndef _MOVIT_YCBCR_H
  #define _MOVIT_YCBCR_H 1
  
-// Shared utility functions between YCbCrInput and YCbCr422InterleavedInput.
+// Shared utility functions between YCbCrInput, YCbCr422InterleavedInput
+// and YCbCrConversionEffect.
  //
  // Conversion from integer to floating-point representation in case of
  // Y'CbCr is seemingly tricky:
diff --git a/ycbcr_conversion_effect.cpp b/ycbcr_conversion_effect.cpp

new file mode 100644 (file)

index 0000000..74ca789
--- /dev/null
+++ b/ycbcr_conversion_effect.cpp
@@ -0,0 +1,47 @@
+#include <epoxy/gl.h>
+#include <assert.h>
+#include <stdio.h>
+#include <algorithm>
+#include <Eigen/Core>
+#include <Eigen/LU>
+
+#include "ycbcr_conversion_effect.h"
+#include "effect_util.h"
+#include "util.h"
+#include "ycbcr.h"
+
+using namespace std;
+using namespace Eigen;
+
+namespace movit {
+
+YCbCrConversionEffect::YCbCrConversionEffect(const YCbCrFormat &ycbcr_format)
+       : ycbcr_format(ycbcr_format)
+{
+}
+
+string YCbCrConversionEffect::output_fragment_shader()
+{
+       float offset[3];
+       Matrix3d ycbcr_to_rgb;
+       compute_ycbcr_matrix(ycbcr_format, offset, &ycbcr_to_rgb);
+
+        string frag_shader = output_glsl_mat3("PREFIX(ycbcr_matrix)", ycbcr_to_rgb.inverse());
+        frag_shader += output_glsl_vec3("PREFIX(offset)", offset[0], offset[1], offset[2]);
+
+       if (ycbcr_format.full_range) {
+               // The card will clamp for us later.
+               frag_shader += "#define YCBCR_CLAMP_RANGE 0\n";
+       } else {
+               frag_shader += "#define YCBCR_CLAMP_RANGE 1\n";
+
+               // These limits come from BT.601 page 8, or BT.701, page 5.
+               // TODO: Use num_levels. Currently we support 8-bit levels only.
+               frag_shader += output_glsl_vec3("PREFIX(ycbcr_min)", 16.0 / 255.0, 16.0 / 255.0, 16.0 / 255.0);
+               frag_shader += output_glsl_vec3("PREFIX(ycbcr_max)", 235.0 / 255.0, 240.0 / 255.0, 240.0 / 255.0);
+       }
+
+       return frag_shader + read_file("ycbcr_conversion_effect.frag");
+}
+
+}  // namespace movit
diff --git a/ycbcr_conversion_effect.frag b/ycbcr_conversion_effect.frag

new file mode 100644 (file)

index 0000000..6bc29b1
--- /dev/null
+++ b/ycbcr_conversion_effect.frag
@@ -0,0 +1,24 @@
+uniform sampler2D PREFIX(tex_y);
+uniform sampler2D PREFIX(tex_cb);
+uniform sampler2D PREFIX(tex_cr);
+
+vec4 FUNCNAME(vec2 tc) {
+       vec4 rgba = INPUT(tc);
+       vec4 ycbcr_a;
+
+       ycbcr_a.rgb = PREFIX(ycbcr_matrix) * rgba.rgb + PREFIX(offset);
+
+#if YCBCR_CLAMP_RANGE
+       // If we use limited-range Y'CbCr, the card's usual 0–255 clamping
+       // won't be enough, so we need to clamp ourselves here.
+       //
+       // We clamp before dither, which is a bit unfortunate, since
+       // it means dither can take us out of the clamped range again.
+       // However, since DitherEffect never adds enough dither to change
+       // the quantized levels, we will be fine in practice.
+       ycbcr_a.rgb = clamp(ycbcr_a.rgb, PREFIX(ycbcr_min), PREFIX(ycbcr_max));
+#endif
+
+       ycbcr_a.a = rgba.a;
+       return ycbcr_a;
+}
diff --git a/ycbcr_conversion_effect.h b/ycbcr_conversion_effect.h

new file mode 100644 (file)

index 0000000..46113bf
--- /dev/null
+++ b/ycbcr_conversion_effect.h
@@ -0,0 +1,35 @@
+#ifndef _MOVIT_YCBCR_CONVERSION_EFFECT_H
+#define _MOVIT_YCBCR_CONVERSION_EFFECT_H 1
+
+// Converts from R'G'B' to Y'CbCr; that is, more or less the opposite of YCbCrInput,
+// except that it keeps the data as 4:4:4 chunked Y'CbCr; you'll need to subsample
+// and/or convert to planar somehow else.
+
+#include <epoxy/gl.h>
+#include <string>
+
+#include "effect.h"
+#include "ycbcr.h"
+
+namespace movit {
+
+class YCbCrConversionEffect : public Effect {
+private:
+       // Should not be instantiated by end users;
+       // call EffectChain::add_ycbcr_output() instead.
+       YCbCrConversionEffect(const YCbCrFormat &ycbcr_format);
+       friend class EffectChain;
+
+public:
+       virtual std::string effect_type_id() const { return "YCbCrConversionEffect"; }
+       std::string output_fragment_shader();
+       virtual AlphaHandling alpha_handling() const { return DONT_CARE_ALPHA_TYPE; }
+       virtual bool one_to_one_sampling() const { return true; }
+
+private:
+       YCbCrFormat ycbcr_format;
+};
+
+}  // namespace movit
+
+#endif // !defined(_MOVIT_YCBCR_CONVERSION_EFFECT_H)
diff --git a/ycbcr_conversion_effect_test.cpp b/ycbcr_conversion_effect_test.cpp

new file mode 100644 (file)

index 0000000..c067baf
--- /dev/null
+++ b/ycbcr_conversion_effect_test.cpp
@@ -0,0 +1,185 @@
+// Unit tests for YCbCrConversionEffect. Mostly done by leveraging
+// YCbCrInput and seeing that the right thing comes out at the
+// other end.
+
+#include <epoxy/gl.h>
+#include <math.h>
+
+#include "effect_chain.h"
+#include "gtest/gtest.h"
+#include "image_format.h"
+#include "test_util.h"
+#include "util.h"
+#include "ycbcr_input.h"
+
+namespace movit {
+
+TEST(YCbCrConversionEffectTest, BasicInOut) {
+       const int width = 1;
+       const int height = 5;
+
+       // Pure-color test inputs, calculated with the formulas in Rec. 601
+       // section 2.5.4.
+       unsigned char y[width * height] = {
+               16, 235, 81, 145, 41,
+       };
+       unsigned char cb[width * height] = {
+               128, 128, 90, 54, 240,
+       };
+       unsigned char cr[width * height] = {
+               128, 128, 240, 34, 110,
+       };
+       unsigned char expected_data[width * height * 4] = {
+               // The same data, just rearranged.
+                16, 128, 128, 255,
+               235, 128, 128, 255,
+                81,  90, 240, 255,
+               145,  54,  34, 255,
+                41, 240, 110, 255
+       };
+
+       unsigned char out_data[width * height * 4];
+
+       EffectChainTester tester(NULL, width, height);
+
+       ImageFormat format;
+       format.color_space = COLORSPACE_sRGB;
+       format.gamma_curve = GAMMA_sRGB;
+
+       YCbCrFormat ycbcr_format;
+       ycbcr_format.luma_coefficients = YCBCR_REC_601;
+       ycbcr_format.full_range = false;
+       ycbcr_format.num_levels = 256;
+       ycbcr_format.chroma_subsampling_x = 1;
+       ycbcr_format.chroma_subsampling_y = 1;
+       ycbcr_format.cb_x_position = 0.5f;
+       ycbcr_format.cb_y_position = 0.5f;
+       ycbcr_format.cr_x_position = 0.5f;
+       ycbcr_format.cr_y_position = 0.5f;
+
+       tester.add_ycbcr_output(format, OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED, ycbcr_format);
+
+       YCbCrInput *input = new YCbCrInput(format, ycbcr_format, width, height);
+       input->set_pixel_data(0, y);
+       input->set_pixel_data(1, cb);
+       input->set_pixel_data(2, cr);
+       tester.get_chain()->add_input(input);
+
+       tester.run(out_data, GL_RGBA, COLORSPACE_sRGB, GAMMA_sRGB);
+       expect_equal(expected_data, out_data, 4 * width, height);
+}
+
+TEST(YCbCrConversionEffectTest, ClampToValidRange) {
+       const int width = 1;
+       const int height = 6;
+
+       // Some out-of-range of at-range values.
+       // Y should be clamped to 16-235 and Cb/Cr to 16-240.
+       // (Alpha should still be 255.)
+       unsigned char y[width * height] = {
+               0, 10, 16, 235, 240, 255
+       };
+       unsigned char cb[width * height] = {
+               0, 10, 16, 235, 240, 255,
+       };
+       unsigned char cr[width * height] = {
+               255, 240, 235, 16, 10, 0,
+       };
+       unsigned char expected_data[width * height * 4] = {
+               16, 16, 240, 255,
+               16, 16, 240, 255,
+               16, 16, 235, 255,
+               235, 235, 16, 255,
+               235, 240, 16, 255,
+               235, 240, 16, 255,
+       };
+
+       unsigned char out_data[width * height * 4];
+
+       EffectChainTester tester(NULL, width, height);
+
+       ImageFormat format;
+       format.color_space = COLORSPACE_sRGB;
+       format.gamma_curve = GAMMA_sRGB;
+
+       YCbCrFormat ycbcr_format;
+       ycbcr_format.luma_coefficients = YCBCR_REC_601;
+       ycbcr_format.full_range = false;
+       ycbcr_format.num_levels = 256;
+       ycbcr_format.chroma_subsampling_x = 1;
+       ycbcr_format.chroma_subsampling_y = 1;
+       ycbcr_format.cb_x_position = 0.5f;
+       ycbcr_format.cb_y_position = 0.5f;
+       ycbcr_format.cr_x_position = 0.5f;
+       ycbcr_format.cr_y_position = 0.5f;
+
+       tester.add_ycbcr_output(format, OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED, ycbcr_format);
+
+       YCbCrInput *input = new YCbCrInput(format, ycbcr_format, width, height);
+       input->set_pixel_data(0, y);
+       input->set_pixel_data(1, cb);
+       input->set_pixel_data(2, cr);
+       tester.get_chain()->add_input(input);
+
+       tester.run(out_data, GL_RGBA, COLORSPACE_sRGB, GAMMA_sRGB);
+       expect_equal(expected_data, out_data, 4 * width, height);
+}
+
+TEST(YCbCrConversionEffectTest, LimitedRangeToFullRange) {
+       const int width = 1;
+       const int height = 5;
+
+       // Pure-color test inputs, calculated with the formulas in Rec. 601
+       // section 2.5.4.
+       unsigned char y[width * height] = {
+               16, 235, 81, 145, 41,
+       };
+       unsigned char cb[width * height] = {
+               128, 128, 90, 54, 240,
+       };
+       unsigned char cr[width * height] = {
+               128, 128, 240, 34, 110,
+       };
+       unsigned char expected_data[width * height * 4] = {
+               // Range now from 0-255 for all components, and values in-between
+               // also adjusted a bit.
+                 0, 128, 128, 255,
+               255, 128, 128, 255,
+                76,  85, 255, 255,
+               150,  44,  21, 255,
+                29, 255, 107, 255
+       };
+
+       unsigned char out_data[width * height * 4];
+
+       EffectChainTester tester(NULL, width, height);
+
+       ImageFormat format;
+       format.color_space = COLORSPACE_sRGB;
+       format.gamma_curve = GAMMA_sRGB;
+
+       YCbCrFormat ycbcr_format;
+       ycbcr_format.luma_coefficients = YCBCR_REC_601;
+       ycbcr_format.full_range = true;
+       ycbcr_format.num_levels = 256;
+       ycbcr_format.chroma_subsampling_x = 1;
+       ycbcr_format.chroma_subsampling_y = 1;
+       ycbcr_format.cb_x_position = 0.5f;
+       ycbcr_format.cb_y_position = 0.5f;
+       ycbcr_format.cr_x_position = 0.5f;
+       ycbcr_format.cr_y_position = 0.5f;
+
+       tester.add_ycbcr_output(format, OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED, ycbcr_format);
+
+       ycbcr_format.full_range = false;
+       YCbCrInput *input = new YCbCrInput(format, ycbcr_format, width, height);
+       input->set_pixel_data(0, y);
+       input->set_pixel_data(1, cb);
+       input->set_pixel_data(2, cr);
+       tester.get_chain()->add_input(input);
+
+       tester.run(out_data, GL_RGBA, COLORSPACE_sRGB, GAMMA_sRGB);
+       expect_equal(expected_data, out_data, 4 * width, height);
+}
+
+}  // namespace movit
author	Steinar H. Gunderson <sgunderson@bigfoot.com>
	Wed, 9 Sep 2015 21:51:48 +0000 (23:51 +0200)
committer	Steinar H. Gunderson <sgunderson@bigfoot.com>
	Wed, 9 Sep 2015 21:52:44 +0000 (23:52 +0200)
.gitignore		patch \| blob \| history
Makefile.in		patch \| blob \| history
effect_chain.cpp		patch \| blob \| history
effect_chain.h		patch \| blob \| history
test_util.cpp		patch \| blob \| history
test_util.h		patch \| blob \| history
ycbcr.h		patch \| blob \| history
ycbcr_conversion_effect.cpp	[new file with mode: 0644]	patch \| blob
ycbcr_conversion_effect.frag	[new file with mode: 0644]	patch \| blob
ycbcr_conversion_effect.h	[new file with mode: 0644]	patch \| blob
ycbcr_conversion_effect_test.cpp	[new file with mode: 0644]	patch \| blob