Make sure we do not send infinities to benchmarking textures.

[movit] / ycbcr_input.h
diff --git a/ycbcr_input.h b/ycbcr_input.h

index 2466eedf0307beb7e6f613ea9695cef740d20437..0d24a409342de2e4fbadc2d60f429b801e7620fb 100644 (file)
--- a/ycbcr_input.h
+++ b/ycbcr_input.h
@@ -1,11 +1,24 @@
  #ifndef _MOVIT_YCBCR_INPUT_H
  #define _MOVIT_YCBCR_INPUT_H 1
  
-// YCbCrInput is for handling planar 8-bit Y'CbCr (also sometimes, usually rather
-// imprecisely, called “YUV”), which is typically what you get from a video decoder.
-// It upsamples planes as needed, using the default linear upsampling OpenGL gives you.
-
-#include <GL/glew.h>
+// YCbCrInput is for handling Y'CbCr (also sometimes, usually rather
+// imprecisely, called “YUV”), which is typically what you get from a video
+// decoder. It supports these formats:
+//
+//   * 8-bit planar Y'CbCr, possibly subsampled (e.g. 4:2:0).
+//   * 8-bit semiplanar Y'CbCr (Y' in one plane, CbCr in another),
+//     possibly subsampled.
+//   * 8-bit interleaved (chunked) Y'CbCr, no subsampling (4:4:4 only).
+//   * All of the above in 10- and 12-bit versions, where each sample is
+//     stored in a 16-bit int (so the 6 or 4 top bits are wasted).
+//   * 10-bit interleaved (chunked) Y'CbCr packed into 32-bit words
+//     (10:10:10:2), no subsampling (4:4:4 only).
+//
+// For the planar and semiplanar cases, it upsamples planes as needed, using
+// the default linear upsampling OpenGL gives you. Note that YCbCr422InterleavedInput
+// supports the important special case of 8-bit 4:2:2 interleaved.
+
+#include <epoxy/gl.h>
  #include <assert.h>
  #include <string>
  
@@ -13,51 +26,57 @@
  #include "effect_chain.h"
  #include "image_format.h"
  #include "input.h"
+#include "ycbcr.h"
  
  namespace movit {
  
  class ResourcePool;
  
-struct YCbCrFormat {
-       // Which formula for Y' to use.
-       YCbCrLumaCoefficients luma_coefficients;
-
-       // If true, assume Y'CbCr coefficients are full-range, ie. go from 0 to 255
-       // instead of the limited 220/225 steps in classic MPEG. For instance,
-       // JPEG uses the Rec. 601 luma coefficients, but full range.
-       bool full_range;
-
-       // Sampling factors for chroma components. For no subsampling (4:4:4),
-       // set both to 1.
-       unsigned chroma_subsampling_x, chroma_subsampling_y;
-
-       // Positioning of the chroma samples. MPEG-1 and JPEG is (0.5, 0.5);
-       // MPEG-2 and newer typically are (0.0, 0.5).
-       float cb_x_position, cb_y_position;
-       float cr_x_position, cr_y_position;
+// Whether the data is planar (Y', Cb and Cr in one texture each) or not.
+enum YCbCrInputSplitting {
+       // The standard, default case; Y', Cb and Cr in one texture each.
+       YCBCR_INPUT_PLANAR,
+
+       // Y' in one texture, and then Cb and Cr interleaved in one texture.
+       // In particular, this is a superset of the relatively popular NV12 mode.
+       // If you specify this mode, the “Cr” pointer texture will be unused
+       // (the “Cb” texture contains both).
+       YCBCR_INPUT_SPLIT_Y_AND_CBCR,
+
+       // Y', Cb and Cr interleaved in the same texture (the “Y” texture;
+       // “Cb” and “Cr” are unused). This means you cannot have any subsampling;
+       // 4:4:4 only.
+       YCBCR_INPUT_INTERLEAVED,
  };
  
  class YCbCrInput : public Input {
  public:
+       // Type can be GL_UNSIGNED_BYTE for 8-bit, GL_UNSIGNED_SHORT for 10- or 12-bit
+       // (or 8-bit, although that's a bit useless), or GL_UNSIGNED_INT_2_10_10_10_REV
+       // for 10-bit (YCBCR_INPUT_INTERLEAVED only).
         YCbCrInput(const ImageFormat &image_format,
                    const YCbCrFormat &ycbcr_format,
-                  unsigned width, unsigned height);
+                  unsigned width, unsigned height,
+                  YCbCrInputSplitting ycbcr_input_splitting = YCBCR_INPUT_PLANAR,
+                  GLenum type = GL_UNSIGNED_BYTE);
         ~YCbCrInput();
  
-       virtual std::string effect_type_id() const { return "YCbCrInput"; }
+       std::string effect_type_id() const override { return "YCbCrInput"; }
  
-       virtual bool can_output_linear_gamma() const { return false; }
-       virtual AlphaHandling alpha_handling() const { return OUTPUT_BLANK_ALPHA; }
+       bool can_output_linear_gamma() const override { return false; }
+       AlphaHandling alpha_handling() const override { return OUTPUT_BLANK_ALPHA; }
  
-       std::string output_fragment_shader();
+       std::string output_fragment_shader() override;
  
         // Uploads the texture if it has changed since last time.
-       void set_gl_state(GLuint glsl_program_num, const std::string& prefix, unsigned *sampler_num);
+       void set_gl_state(GLuint glsl_program_num, const std::string& prefix, unsigned *sampler_num) override;
  
-       unsigned get_width() const { return width; }
-       unsigned get_height() const { return height; }
-       Colorspace get_color_space() const { return image_format.color_space; }
-       GammaCurve get_gamma_curve() const { return image_format.gamma_curve; }
+       unsigned get_width() const override { return width; }
+       unsigned get_height() const override { return height; }
+       Colorspace get_color_space() const override { return image_format.color_space; }
+       GammaCurve get_gamma_curve() const override { return image_format.gamma_curve; }
+       bool can_supply_mipmaps() const override { return ycbcr_input_splitting == YCBCR_INPUT_INTERLEAVED; }
+       bool is_single_texture() const override { return ycbcr_input_splitting == YCBCR_INPUT_INTERLEAVED; }
  
         // Tells the input where to fetch the actual pixel data. Note that if you change
         // this data, you must either call set_pixel_data() again (using the same pointer
@@ -71,35 +90,115 @@ public:
         // the pointer (and PBO, if set) has to be valid at the time of the render call.
         void set_pixel_data(unsigned channel, const unsigned char *pixel_data, GLuint pbo = 0)
         {
-               assert(channel >= 0 && channel < 3);
+               assert(type == GL_UNSIGNED_BYTE || type == GL_UNSIGNED_INT_2_10_10_10_REV);
+               assert(channel >= 0 && channel < num_channels);
                 this->pixel_data[channel] = pixel_data;
                 this->pbos[channel] = pbo;
                 invalidate_pixel_data();
         }
  
+       void set_pixel_data(unsigned channel, const uint16_t *pixel_data, GLuint pbo = 0)
+       {
+               assert(type == GL_UNSIGNED_SHORT);
+               assert(channel >= 0 && channel < num_channels);
+               this->pixel_data[channel] = reinterpret_cast<const unsigned char *>(pixel_data);
+               this->pbos[channel] = pbo;
+               invalidate_pixel_data();
+       }
+
+       void set_pixel_data(unsigned channel, const uint32_t *pixel_data, GLuint pbo = 0)
+       {
+               assert(type == GL_UNSIGNED_INT_2_10_10_10_REV);
+               assert(channel == 0);
+               this->pixel_data[channel] = reinterpret_cast<const unsigned char *>(pixel_data);
+               this->pbos[channel] = pbo;
+               invalidate_pixel_data();
+       }
+
         void invalidate_pixel_data();
  
-       void set_pitch(unsigned channel, unsigned pitch) {
-               assert(channel >= 0 && channel < 3);
+       // Note: Sets pitch to width, so even if your pitch is unchanged,
+       // you will need to re-set it after this call.
+       void set_width(unsigned width)
+       {
+               assert(width != 0);
+               this->width = width;
+
+               assert(width % ycbcr_format.chroma_subsampling_x == 0);
+               pitch[0] = widths[0] = width;
+               pitch[1] = widths[1] = width / ycbcr_format.chroma_subsampling_x;
+               pitch[2] = widths[2] = width / ycbcr_format.chroma_subsampling_x;
+               invalidate_pixel_data();
+       }
+
+       void set_height(unsigned height)
+       {
+               assert(height != 0);
+               this->height = height;
+
+               assert(height % ycbcr_format.chroma_subsampling_y == 0);
+               heights[0] = height;
+               heights[1] = height / ycbcr_format.chroma_subsampling_y;
+               heights[2] = height / ycbcr_format.chroma_subsampling_y;
+               invalidate_pixel_data();
+       }
+
+       void set_pitch(unsigned channel, unsigned pitch)
+       {
+               assert(pitch != 0);
+               assert(channel >= 0 && channel < num_channels);
                 this->pitch[channel] = pitch;
                 invalidate_pixel_data();
         }
  
-       virtual void inform_added(EffectChain *chain)
+       // Tells the input to use the specific OpenGL texture as pixel data for the given
+       // channel. The comments on FlatInput::set_texture_num() also apply here, except
+       // that this input generally does not use mipmaps.
+       void set_texture_num(unsigned channel, GLuint texture_num)
+       {
+               possibly_release_texture(channel);
+               this->texture_num[channel] = texture_num;
+               this->owns_texture[channel] = false;
+       }
+
+       // You can change the Y'CbCr format freely, also after finalize,
+       // although with one limitation: If Cb and Cr come from the same
+       // texture and their offsets are the same (i.e., within 1e-6)
+       // when finalizing, they must continue to be so forever, as this
+       // optimization is compiled into the shader.
+       //
+       // If you change subsampling parameters, you'll need to call
+       // set_width() / set_height() again after this.
+       void change_ycbcr_format(const YCbCrFormat &ycbcr_format);
+
+       void inform_added(EffectChain *chain) override
         {
                 resource_pool = chain->get_resource_pool();
         }
  
+       bool set_int(const std::string& key, int value) override;
+
  private:
+       // Release the texture in the given channel if we have any, and it is owned by us.
+       void possibly_release_texture(unsigned channel);
+
         ImageFormat image_format;
         YCbCrFormat ycbcr_format;
+       GLuint num_channels;
+       YCbCrInputSplitting ycbcr_input_splitting;
+       int needs_mipmaps;  // Only allowed if ycbcr_input_splitting == YCBCR_INPUT_INTERLEAVED.
+       GLenum type;
         GLuint pbos[3], texture_num[3];
-
-       int needs_mipmaps;
+       GLint uniform_tex_y, uniform_tex_cb, uniform_tex_cr;
+       Eigen::Matrix3d uniform_ycbcr_matrix;
+       float uniform_offset[3];
+       Point2D uniform_cb_offset, uniform_cr_offset;
+       bool cb_cr_offsets_equal;
  
         unsigned width, height, widths[3], heights[3];
         const unsigned char *pixel_data[3];
         unsigned pitch[3];
+       bool owns_texture[3];
         ResourcePool *resource_pool;
  };