Move chroma subsampling into its own class.

[nageru] / mixer.cpp
diff --git a/mixer.cpp b/mixer.cpp

index d7f86558e16a98d4ada1be0632f9489c3eb9294f..d544b0bf0801ba5208d10ddb0f37b396cd6911a8 100644 (file)
--- a/mixer.cpp
+++ b/mixer.cpp
@@ -3,7 +3,6 @@
  #include "mixer.h"
  
  #include <assert.h>
-#include <endian.h>
  #include <epoxy/egl.h>
  #include <movit/effect_chain.h>
  #include <movit/effect_util.h>
@@ -11,38 +10,42 @@
  #include <movit/image_format.h>
  #include <movit/init.h>
  #include <movit/resource_pool.h>
-#include <movit/util.h>
  #include <stdint.h>
  #include <stdio.h>
  #include <stdlib.h>
  #include <sys/resource.h>
-#include <sys/time.h>
-#include <time.h>
  #include <algorithm>
  #include <chrono>
-#include <cmath>
  #include <condition_variable>
  #include <cstddef>
+#include <cstdint>
  #include <memory>
  #include <mutex>
+#include <ratio>
  #include <string>
  #include <thread>
  #include <utility>
  #include <vector>
  
+#include "DeckLinkAPI.h"
+#include "LinuxCOM.h"
+#include "alsa_output.h"
  #include "bmusb/bmusb.h"
  #include "bmusb/fake_capture.h"
+#include "chroma_subsampler.h"
  #include "context.h"
-#include "db.h"
  #include "decklink_capture.h"
  #include "defs.h"
  #include "disk_space_estimator.h"
  #include "flags.h"
+#include "input_mapping.h"
  #include "pbo_frame_allocator.h"
  #include "ref_counted_gl_sync.h"
+#include "resampling_queue.h"
  #include "timebase.h"
  #include "video_encoder.h"
  
+class IDeckLink;
  class QOpenGLContext;
  
  using namespace movit;
@@ -126,15 +129,15 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
         inout_format.gamma_curve = GAMMA_sRGB;
  
         // Display chain; shows the live output produced by the main chain (its RGBA version).
-       display_chain.reset(new EffectChain(WIDTH, HEIGHT, resource_pool.get()));
+       display_chain.reset(new EffectChain(global_flags.width, global_flags.height, resource_pool.get()));
         check_error();
-       display_input = new FlatInput(inout_format, FORMAT_RGB, GL_UNSIGNED_BYTE, WIDTH, HEIGHT);  // FIXME: GL_UNSIGNED_BYTE is really wrong.
+       display_input = new FlatInput(inout_format, FORMAT_RGB, GL_UNSIGNED_BYTE, global_flags.width, global_flags.height);  // FIXME: GL_UNSIGNED_BYTE is really wrong.
         display_chain->add_input(display_input);
         display_chain->add_output(inout_format, OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED);
         display_chain->set_dither_bits(0);  // Don't bother.
         display_chain->finalize();
  
-       video_encoder.reset(new VideoEncoder(resource_pool.get(), h264_encoder_surface, global_flags.va_display, WIDTH, HEIGHT, &httpd, global_disk_space_estimator));
+       video_encoder.reset(new VideoEncoder(resource_pool.get(), h264_encoder_surface, global_flags.va_display, global_flags.width, global_flags.height, &httpd, global_disk_space_estimator));
  
         // Start listening for clients only once VideoEncoder has written its header, if any.
         httpd.start(9095);
@@ -172,7 +175,7 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
  
         unsigned num_fake_cards = 0;
         for ( ; card_index < num_cards; ++card_index, ++num_fake_cards) {
-               FakeCapture *capture = new FakeCapture(WIDTH, HEIGHT, FAKE_FPS, OUTPUT_FREQUENCY, card_index, global_flags.fake_cards_audio);
+               FakeCapture *capture = new FakeCapture(global_flags.width, global_flags.height, FAKE_FPS, OUTPUT_FREQUENCY, card_index, global_flags.fake_cards_audio);
                 configure_card(card_index, capture, /*is_fake_capture=*/true);
         }
  
@@ -183,53 +186,11 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
         BMUSBCapture::set_card_connected_callback(bind(&Mixer::bm_hotplug_add, this, _1));
         BMUSBCapture::start_bm_thread();
  
-       for (card_index = 0; card_index < num_cards; ++card_index) {
+       for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
                 cards[card_index].queue_length_policy.reset(card_index);
-               cards[card_index].capture->start_bm_capture();
         }
  
-       // Set up stuff for NV12 conversion.
-
-       // Cb/Cr shader.
-       string cbcr_vert_shader =
-               "#version 130 \n"
-               " \n"
-               "in vec2 position; \n"
-               "in vec2 texcoord; \n"
-               "out vec2 tc0; \n"
-               "uniform vec2 foo_chroma_offset_0; \n"
-               " \n"
-               "void main() \n"
-               "{ \n"
-               "    // The result of glOrtho(0.0, 1.0, 0.0, 1.0, 0.0, 1.0) is: \n"
-               "    // \n"
-               "    //   2.000  0.000  0.000 -1.000 \n"
-               "    //   0.000  2.000  0.000 -1.000 \n"
-               "    //   0.000  0.000 -2.000 -1.000 \n"
-               "    //   0.000  0.000  0.000  1.000 \n"
-               "    gl_Position = vec4(2.0 * position.x - 1.0, 2.0 * position.y - 1.0, -1.0, 1.0); \n"
-               "    vec2 flipped_tc = texcoord; \n"
-               "    tc0 = flipped_tc + foo_chroma_offset_0; \n"
-               "} \n";
-       string cbcr_frag_shader =
-               "#version 130 \n"
-               "in vec2 tc0; \n"
-               "uniform sampler2D cbcr_tex; \n"
-               "out vec4 FragColor; \n"
-               "void main() { \n"
-               "    FragColor = texture(cbcr_tex, tc0); \n"
-               "} \n";
-       vector<string> frag_shader_outputs;
-       cbcr_program_num = resource_pool->compile_glsl_program(cbcr_vert_shader, cbcr_frag_shader, frag_shader_outputs);
-
-       float vertices[] = {
-               0.0f, 2.0f,
-               0.0f, 0.0f,
-               2.0f, 0.0f
-       };
-       cbcr_vbo = generate_vbo(2, GL_FLOAT, sizeof(vertices), vertices);
-       cbcr_position_attribute_index = glGetAttribLocation(cbcr_program_num, "position");
-       cbcr_texcoord_attribute_index = glGetAttribLocation(cbcr_program_num, "texcoord");
+       chroma_subsampler.reset(new ChromaSubsampler(resource_pool.get()));
  
         if (global_flags.enable_alsa_output) {
                 alsa.reset(new ALSAOutput(OUTPUT_FREQUENCY, /*num_channels=*/2));
@@ -238,8 +199,6 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
  
  Mixer::~Mixer()
  {
-       resource_pool->release_glsl_program(cbcr_program_num);
-       glDeleteBuffers(1, &cbcr_vbo);
         BMUSBCapture::stop_bm_thread();
  
         for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
@@ -267,20 +226,19 @@ void Mixer::configure_card(unsigned card_index, CaptureInterface *capture, bool
         card->is_fake_capture = is_fake_capture;
         card->capture->set_frame_callback(bind(&Mixer::bm_frame, this, card_index, _1, _2, _3, _4, _5, _6, _7));
         if (card->frame_allocator == nullptr) {
-               card->frame_allocator.reset(new PBOFrameAllocator(8 << 20, WIDTH, HEIGHT));  // 8 MB.
+               card->frame_allocator.reset(new PBOFrameAllocator(8 << 20, global_flags.width, global_flags.height));  // 8 MB.
         }
         card->capture->set_video_frame_allocator(card->frame_allocator.get());
         if (card->surface == nullptr) {
                 card->surface = create_surface_with_same_format(mixer_surface);
         }
         while (!card->new_frames.empty()) card->new_frames.pop();
-       card->fractional_samples = 0;
         card->last_timecode = -1;
         card->capture->configure_card();
  
         DeviceSpec device{InputSourceType::CAPTURE_CARD, card_index};
         audio_mixer.reset_resampler(device);
-       audio_mixer.set_name(device, card->capture->get_description());
+       audio_mixer.set_display_name(device, card->capture->get_description());
         audio_mixer.trigger_state_changed_callback();
  }
  
@@ -508,6 +466,7 @@ void Mixer::bm_frame(unsigned card_index, uint16_t timecode,
                         new_frame.interlaced = video_format.interlaced;
                         new_frame.upload_func = upload_func;
                         new_frame.dropped_frames = dropped_frames;
+                       new_frame.received_timestamp = video_frame.received_timestamp;  // Ignore the audio timestamp.
                         card->new_frames.push(move(new_frame));
                         card->new_frames_changed.notify_all();
                 }
@@ -534,6 +493,12 @@ void Mixer::thread_func()
                 exit(1);
         }
  
+       // Start the actual capture. (We don't want to do it before we're actually ready
+       // to process output frames.)
+       for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
+               cards[card_index].capture->start_bm_capture();
+       }
+
         steady_clock::time_point start, now;
         start = steady_clock::now();
  
@@ -543,14 +508,13 @@ void Mixer::thread_func()
         while (!should_quit) {
                 CaptureCard::NewFrame new_frames[MAX_VIDEO_CARDS];
                 bool has_new_frame[MAX_VIDEO_CARDS] = { false };
-               int num_samples[MAX_VIDEO_CARDS] = { 0 };
  
                 unsigned master_card_index = theme->map_signal(master_clock_channel);
                 assert(master_card_index < num_cards);
  
-               get_one_frame_from_each_card(master_card_index, new_frames, has_new_frame, num_samples);
-               schedule_audio_resampling_tasks(new_frames[master_card_index].dropped_frames, num_samples[master_card_index], new_frames[master_card_index].length);
-               stats_dropped_frames += new_frames[master_card_index].dropped_frames;
+               OutputFrameInfo output_frame_info = get_one_frame_from_each_card(master_card_index, new_frames, has_new_frame);
+               schedule_audio_resampling_tasks(output_frame_info.dropped_frames, output_frame_info.num_samples, output_frame_info.frame_duration);
+               stats_dropped_frames += output_frame_info.dropped_frames;
  
                 handle_hotplugged_cards();
  
@@ -591,7 +555,7 @@ void Mixer::thread_func()
                         }
                 }
  
-               int64_t frame_duration = new_frames[master_card_index].length;
+               int64_t frame_duration = output_frame_info.frame_duration;
                 render_one_frame(frame_duration);
                 ++frame;
                 pts_int += frame_duration;
@@ -619,10 +583,15 @@ void Mixer::thread_func()
                                         assert(false);
                                 }
  
-                               printf(", using %ld / %ld MB lockable memory (%.1f%%)",
-                                       long(used.ru_maxrss / 1024),
-                                       long(limit.rlim_cur / 1048576),
-                                       float(100.0 * (used.ru_maxrss * 1024.0) / limit.rlim_cur));
+                               if (limit.rlim_cur == 0) {
+                                       printf(", using %ld MB memory (locked)",
+                                               long(used.ru_maxrss / 1024));
+                               } else {
+                                       printf(", using %ld / %ld MB lockable memory (%.1f%%)",
+                                               long(used.ru_maxrss / 1024),
+                                               long(limit.rlim_cur / 1048576),
+                                               float(100.0 * (used.ru_maxrss * 1024.0) / limit.rlim_cur));
+                               }
                         } else {
                                 printf(", using %ld MB memory (not locked)",
                                         long(used.ru_maxrss / 1024));
@@ -652,8 +621,10 @@ void Mixer::thread_func()
         resource_pool->clean_context();
  }
  
-void Mixer::get_one_frame_from_each_card(unsigned master_card_index, CaptureCard::NewFrame new_frames[MAX_VIDEO_CARDS], bool has_new_frame[MAX_VIDEO_CARDS], int num_samples[MAX_VIDEO_CARDS])
+Mixer::OutputFrameInfo Mixer::get_one_frame_from_each_card(unsigned master_card_index, CaptureCard::NewFrame new_frames[MAX_VIDEO_CARDS], bool has_new_frame[MAX_VIDEO_CARDS])
  {
+       OutputFrameInfo output_frame_info;
+
  start:
         // The first card is the master timer, so wait for it to have a new frame.
         // TODO: Add a timeout.
@@ -680,11 +651,6 @@ start:
                 card->new_frames.pop();
                 card->new_frames_changed.notify_all();
  
-               int num_samples_times_timebase = OUTPUT_FREQUENCY * new_frames[card_index].length + card->fractional_samples;
-               num_samples[card_index] = num_samples_times_timebase / TIMEBASE;
-               card->fractional_samples = num_samples_times_timebase % TIMEBASE;
-               assert(num_samples[card_index] >= 0);
-
                 if (card_index == master_card_index) {
                         // We don't use the queue length policy for the master card,
                         // but we will if it stops being the master. Thus, clear out
@@ -699,6 +665,18 @@ start:
                         }
                 }
         }
+
+       output_frame_info.dropped_frames = new_frames[master_card_index].dropped_frames;
+       output_frame_info.frame_duration = new_frames[master_card_index].length;
+
+       // This might get off by a fractional sample when changing master card
+       // between ones with different frame rates, but that's fine.
+       int num_samples_times_timebase = OUTPUT_FREQUENCY * output_frame_info.frame_duration + fractional_samples;
+       output_frame_info.num_samples = num_samples_times_timebase / TIMEBASE;
+       fractional_samples = num_samples_times_timebase % TIMEBASE;
+       assert(output_frame_info.num_samples >= 0);
+
+       return output_frame_info;
  }
  
  void Mixer::handle_hotplugged_cards()
@@ -708,7 +686,7 @@ void Mixer::handle_hotplugged_cards()
                 CaptureCard *card = &cards[card_index];
                 if (card->capture->get_disconnected()) {
                         fprintf(stderr, "Card %u went away, replacing with a fake card.\n", card_index);
-                       FakeCapture *capture = new FakeCapture(WIDTH, HEIGHT, FAKE_FPS, OUTPUT_FREQUENCY, card_index, global_flags.fake_cards_audio);
+                       FakeCapture *capture = new FakeCapture(global_flags.width, global_flags.height, FAKE_FPS, OUTPUT_FREQUENCY, card_index, global_flags.fake_cards_audio);
                         configure_card(card_index, capture, /*is_fake_capture=*/true);
                         card->queue_length_policy.reset(card_index);
                         card->capture->start_bm_capture();
@@ -785,7 +763,7 @@ void Mixer::schedule_audio_resampling_tasks(unsigned dropped_frames, int num_sam
  void Mixer::render_one_frame(int64_t duration)
  {
         // Get the main chain from the theme, and set its state immediately.
-       Theme::Chain theme_main_chain = theme->get_chain(0, pts(), WIDTH, HEIGHT, input_state);
+       Theme::Chain theme_main_chain = theme->get_chain(0, pts(), global_flags.width, global_flags.height, input_state);
         EffectChain *chain = theme_main_chain.chain;
         theme_main_chain.setup_chain();
         //theme_main_chain.chain->enable_phase_timing(true);
@@ -795,14 +773,14 @@ void Mixer::render_one_frame(int64_t duration)
         assert(got_frame);
  
         // Render main chain.
-       GLuint cbcr_full_tex = resource_pool->create_2d_texture(GL_RG8, WIDTH, HEIGHT);
-       GLuint rgba_tex = resource_pool->create_2d_texture(GL_RGB565, WIDTH, HEIGHT);  // Saves texture bandwidth, although dithering gets messed up.
+       GLuint cbcr_full_tex = resource_pool->create_2d_texture(GL_RG8, global_flags.width, global_flags.height);
+       GLuint rgba_tex = resource_pool->create_2d_texture(GL_RGB565, global_flags.width, global_flags.height);  // Saves texture bandwidth, although dithering gets messed up.
         GLuint fbo = resource_pool->create_fbo(y_tex, cbcr_full_tex, rgba_tex);
         check_error();
-       chain->render_to_fbo(fbo, WIDTH, HEIGHT);
+       chain->render_to_fbo(fbo, global_flags.width, global_flags.height);
         resource_pool->release_fbo(fbo);
  
-       subsample_chroma(cbcr_full_tex, cbcr_tex);
+       chroma_subsampler->subsample_chroma(cbcr_full_tex, global_flags.width, global_flags.height, cbcr_tex);
         resource_pool->release_2d_texture(cbcr_full_tex);
  
         // Set the right state for rgba_tex.
@@ -812,7 +790,7 @@ void Mixer::render_one_frame(int64_t duration)
         glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
         glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE);
  
-       const int64_t av_delay = TIMEBASE / 10;  // Corresponds to the fixed delay in resampling_queue.h. TODO: Make less hard-coded.
+       const int64_t av_delay = lrint(global_flags.audio_queue_length_ms * 0.001 * TIMEBASE);  // Corresponds to the delay in ResamplingQueue.
         RefCountedGLsync fence = video_encoder->end_frame(pts_int + av_delay, duration, theme_main_chain.input_frames);
  
         // The live frame just shows the RGBA texture we just rendered.
@@ -830,7 +808,7 @@ void Mixer::render_one_frame(int64_t duration)
         // Set up preview and any additional channels.
         for (int i = 1; i < theme->get_num_channels() + 2; ++i) {
                 DisplayFrame display_frame;
-               Theme::Chain chain = theme->get_chain(i, pts(), WIDTH, HEIGHT, input_state);  // FIXME: dimensions
+               Theme::Chain chain = theme->get_chain(i, pts(), global_flags.width, global_flags.height, input_state);  // FIXME: dimensions
                 display_frame.chain = chain.chain;
                 display_frame.setup_chain = chain.setup_chain;
                 display_frame.ready_fence = fence;
@@ -857,75 +835,20 @@ void Mixer::audio_thread_func()
  
                 ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy =
                         task.adjust_rate ? ResamplingQueue::ADJUST_RATE : ResamplingQueue::DO_NOT_ADJUST_RATE;
-               vector<float> samples_out = audio_mixer.get_output(double(task.pts_int) / TIMEBASE, task.num_samples, rate_adjustment_policy);
+               vector<float> samples_out = audio_mixer.get_output(
+                       double(task.pts_int) / TIMEBASE,
+                       task.num_samples,
+                       rate_adjustment_policy);
  
                 // Send the samples to the sound card, then add them to the output.
                 if (alsa) {
                         alsa->write(samples_out);
                 }
+               decklink_output->send_audio(task.pts_int, samples_out);
                 video_encoder->add_audio(task.pts_int, move(samples_out));
         }
  }
  
-void Mixer::subsample_chroma(GLuint src_tex, GLuint dst_tex)
-{
-       GLuint vao;
-       glGenVertexArrays(1, &vao);
-       check_error();
-
-       glBindVertexArray(vao);
-       check_error();
-
-       // Extract Cb/Cr.
-       GLuint fbo = resource_pool->create_fbo(dst_tex);
-       glBindFramebuffer(GL_FRAMEBUFFER, fbo);
-       glViewport(0, 0, WIDTH/2, HEIGHT/2);
-       check_error();
-
-       glUseProgram(cbcr_program_num);
-       check_error();
-
-       glActiveTexture(GL_TEXTURE0);
-       check_error();
-       glBindTexture(GL_TEXTURE_2D, src_tex);
-       check_error();
-       glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR);
-       check_error();
-       glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
-       check_error();
-       glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE);
-       check_error();
-
-       float chroma_offset_0[] = { -0.5f / WIDTH, 0.0f };
-       set_uniform_vec2(cbcr_program_num, "foo", "chroma_offset_0", chroma_offset_0);
-
-       glBindBuffer(GL_ARRAY_BUFFER, cbcr_vbo);
-       check_error();
-
-       for (GLint attr_index : { cbcr_position_attribute_index, cbcr_texcoord_attribute_index }) {
-               glEnableVertexAttribArray(attr_index);
-               check_error();
-               glVertexAttribPointer(attr_index, 2, GL_FLOAT, GL_FALSE, 0, BUFFER_OFFSET(0));
-               check_error();
-       }
-
-       glDrawArrays(GL_TRIANGLES, 0, 3);
-       check_error();
-
-       for (GLint attr_index : { cbcr_position_attribute_index, cbcr_texcoord_attribute_index }) {
-               glDisableVertexAttribArray(attr_index);
-               check_error();
-       }
-
-       glUseProgram(0);
-       check_error();
-       glBindFramebuffer(GL_FRAMEBUFFER, 0);
-       check_error();
-
-       resource_pool->release_fbo(fbo);
-       glDeleteVertexArrays(1, &vao);
-}
-
  void Mixer::release_display_frame(DisplayFrame *frame)
  {
         for (GLuint texnum : frame->temp_textures) {