Move the R128 and correlation measurements into AudioMixer.

author Steinar H. Gunderson <sgunderson@bigfoot.com>

Sat, 13 Aug 2016 17:22:07 +0000 (19:22 +0200)

committer Steinar H. Gunderson <sgunderson@bigfoot.com>

Wed, 19 Oct 2016 22:55:44 +0000 (00:55 +0200)
author Steinar H. Gunderson <sgunderson@bigfoot.com>
Sat, 13 Aug 2016 17:22:07 +0000 (19:22 +0200)
committer Steinar H. Gunderson <sgunderson@bigfoot.com>
Wed, 19 Oct 2016 22:55:44 +0000 (00:55 +0200)
diff --git a/audio_mixer.cpp b/audio_mixer.cpp

index 1c570fa870468e54134ac892c5eac016372754ce..5a7804582ce591f4b80432fe418c01ebe2c7c4e7 100644 (file)
--- a/audio_mixer.cpp
+++ b/audio_mixer.cpp
@@ -77,13 +77,38 @@ void convert_fixed32_to_fp32(float *dst, size_t out_channel, size_t out_num_chan
         }
  }
  
+float find_peak(const float *samples, size_t num_samples)
+{
+       float m = fabs(samples[0]);
+       for (size_t i = 1; i < num_samples; ++i) {
+               m = max(m, fabs(samples[i]));
+       }
+       return m;
+}
+
+void deinterleave_samples(const vector<float> &in, vector<float> *out_l, vector<float> *out_r)
+{
+       size_t num_samples = in.size() / 2;
+       out_l->resize(num_samples);
+       out_r->resize(num_samples);
+
+       const float *inptr = in.data();
+       float *lptr = &(*out_l)[0];
+       float *rptr = &(*out_r)[0];
+       for (size_t i = 0; i < num_samples; ++i) {
+               *lptr++ = *inptr++;
+               *rptr++ = *inptr++;
+       }
+}
+
  }  // namespace
  
  AudioMixer::AudioMixer(unsigned num_cards)
         : num_cards(num_cards),
           level_compressor(OUTPUT_FREQUENCY),
           limiter(OUTPUT_FREQUENCY),
-         compressor(OUTPUT_FREQUENCY)
+         compressor(OUTPUT_FREQUENCY),
+         correlation(OUTPUT_FREQUENCY)
  {
         locut.init(FILTER_HPF, 2);
  
@@ -108,6 +133,13 @@ AudioMixer::AudioMixer(unsigned num_cards)
  
         // Look for ALSA cards.
         available_alsa_cards = ALSAInput::enumerate_devices();
+
+       r128.init(2, OUTPUT_FREQUENCY);
+       r128.integr_start();
+
+       // hlen=16 is pretty low quality, but we use quite a bit of CPU otherwise,
+       // and there's a limit to how important the peak meter is.
+       peak_resampler.setup(OUTPUT_FREQUENCY, OUTPUT_FREQUENCY * 4, /*num_channels=*/2, /*hlen=*/16, /*frel=*/1.0);
  }
  
  AudioMixer::~AudioMixer()
@@ -418,7 +450,7 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
         // Note that there's a feedback loop here, so we choose a very slow filter
         // (half-time of 30 seconds).
         double target_loudness_factor, alpha;
-       double loudness_lu = loudness_lufs - ref_level_lufs;
+       double loudness_lu = r128.loudness_M() - ref_level_lufs;
         double current_makeup_lu = to_db(final_makeup_gain);
         target_loudness_factor = final_makeup_gain * from_db(-loudness_lu);
  
@@ -446,9 +478,74 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
                 final_makeup_gain = m;
         }
  
+       update_meters(samples_out);
+
         return samples_out;
  }
  
+void AudioMixer::update_meters(const vector<float> &samples)
+{
+       // Upsample 4x to find interpolated peak.
+       peak_resampler.inp_data = const_cast<float *>(samples.data());
+       peak_resampler.inp_count = samples.size() / 2;
+
+       vector<float> interpolated_samples;
+       interpolated_samples.resize(samples.size());
+       {
+               unique_lock<mutex> lock(audio_measure_mutex);
+
+               while (peak_resampler.inp_count > 0) {  // About four iterations.
+                       peak_resampler.out_data = &interpolated_samples[0];
+                       peak_resampler.out_count = interpolated_samples.size() / 2;
+                       peak_resampler.process();
+                       size_t out_stereo_samples = interpolated_samples.size() / 2 - peak_resampler.out_count;
+                       peak = max<float>(peak, find_peak(interpolated_samples.data(), out_stereo_samples * 2));
+                       peak_resampler.out_data = nullptr;
+               }
+       }
+
+       // Find R128 levels and L/R correlation.
+       vector<float> left, right;
+       deinterleave_samples(samples, &left, &right);
+       float *ptrs[] = { left.data(), right.data() };
+       {
+               unique_lock<mutex> lock(audio_measure_mutex);
+               r128.process(left.size(), ptrs);
+               correlation.process_samples(samples);
+       }
+
+       send_audio_level_callback();
+}
+
+void AudioMixer::reset_meters()
+{
+       unique_lock<mutex> lock(audio_measure_mutex);
+       peak_resampler.reset();
+       peak = 0.0f;
+       r128.reset();
+       r128.integr_start();
+       correlation.reset();
+}
+
+void AudioMixer::send_audio_level_callback()
+{
+       if (audio_level_callback == nullptr) {
+               return;
+       }
+
+       unique_lock<mutex> lock(audio_measure_mutex);
+       double loudness_s = r128.loudness_S();
+       double loudness_i = r128.integrated();
+       double loudness_range_low = r128.range_min();
+       double loudness_range_high = r128.range_max();
+
+       audio_level_callback(loudness_s, to_db(peak),
+               loudness_i, loudness_range_low, loudness_range_high,
+               gain_staging_db,
+               to_db(final_makeup_gain),
+               correlation.get_correlation());
+}
+
  map<DeviceSpec, DeviceInfo> AudioMixer::get_devices() const
  {
         lock_guard<timed_mutex> lock(audio_mutex);
diff --git a/audio_mixer.h b/audio_mixer.h

index 6e1d5a9458fbb1ef3d808d7cae162591a2ae878d..75b468a120f7d1f39aa293009e9b76153ae4e9a3 100644 (file)
--- a/audio_mixer.h
+++ b/audio_mixer.h
@@ -7,9 +7,6 @@
  // all together into one final audio signal.
  //
  // All operations on AudioMixer (except destruction) are thread-safe.
-//
-// TODO: There might be more audio stuff that should be moved here
-// from Mixer.
  
  #include <math.h>
  #include <stdint.h>
@@ -19,11 +16,14 @@
  #include <mutex>
  #include <set>
  #include <vector>
+#include <zita-resampler/resampler.h>
  
  #include "alsa_input.h"
  #include "bmusb/bmusb.h"
+#include "correlation_measurer.h"
  #include "db.h"
  #include "defs.h"
+#include "ebu_r128_proc.h"
  #include "filter.h"
  #include "resampling_queue.h"
  #include "stereocompressor.h"
@@ -77,6 +77,7 @@ public:
         AudioMixer(unsigned num_cards);
         ~AudioMixer();
         void reset_resampler(DeviceSpec device_spec);
+       void reset_meters();
  
         // Add audio (or silence) to the given device's queue. Can return false if
         // the lock wasn't successfully taken; if so, you should simply try again.
@@ -88,9 +89,6 @@ public:
  
         std::vector<float> get_output(double pts, unsigned num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy);
  
-       // See comments inside get_output().
-       void set_current_loudness(double level_lufs) { loudness_lufs = level_lufs; }
-
         void set_fader_volume(unsigned bus_index, float level_db) { fader_volume_db[bus_index] = level_db; }
         std::map<DeviceSpec, DeviceInfo> get_devices() const;
         void set_name(DeviceSpec device_spec, const std::string &name);
@@ -203,6 +201,15 @@ public:
                 return final_makeup_gain_auto;
         }
  
+       typedef std::function<void(float level_lufs, float peak_db,
+                                  float global_level_lufs, float range_low_lufs, float range_high_lufs,
+                                  float gain_staging_db, float final_makeup_gain_db,
+                                  float correlation)> audio_level_callback_t;
+       void set_audio_level_callback(audio_level_callback_t callback)
+       {
+               audio_level_callback = callback;
+       }
+
  private:
         struct AudioDevice {
                 std::unique_ptr<ResamplingQueue> resampling_queue;
@@ -221,6 +228,8 @@ private:
         void reset_resampler_mutex_held(DeviceSpec device_spec);
         void reset_alsa_mutex_held(DeviceSpec device_spec);
         std::map<DeviceSpec, DeviceInfo> get_devices_mutex_held() const;
+       void update_meters(const std::vector<float> &samples);
+       void send_audio_level_callback();
  
         unsigned num_cards;
  
@@ -245,8 +254,6 @@ private:
         static constexpr float ref_level_dbfs = -14.0f;  // Chosen so that we end up around 0 LU in practice.
         static constexpr float ref_level_lufs = -23.0f;  // 0 LU, more or less by definition.
  
-       std::atomic<float> loudness_lufs{ref_level_lufs};
-
         StereoCompressor limiter;
         std::atomic<float> limiter_threshold_dbfs{ref_level_dbfs + 4.0f};   // 4 dB.
         std::atomic<bool> limiter_enabled{true};
@@ -259,6 +266,13 @@ private:
  
         InputMapping input_mapping;  // Under audio_mutex.
         std::atomic<float> fader_volume_db[MAX_BUSES] {{ 0.0f }};
+
+       audio_level_callback_t audio_level_callback = nullptr;
+       mutable std::mutex audio_measure_mutex;
+       Ebu_r128_proc r128;  // Under audio_measure_mutex.
+       CorrelationMeasurer correlation;  // Under audio_measure_mutex.
+       Resampler peak_resampler;  // Under audio_measure_mutex.
+       std::atomic<float> peak{0.0f};
  };
  
  #endif  // !defined(_AUDIO_MIXER_H)
diff --git a/mainwindow.cpp b/mainwindow.cpp

index 5eb631a8890efa2ba9131c5c298657821671a3e0..28f0393fce2c4a20e1ef50a180cb8314cc57a1ae 100644 (file)
--- a/mainwindow.cpp
+++ b/mainwindow.cpp
@@ -217,7 +217,7 @@ void MainWindow::mixer_created(Mixer *mixer)
                 global_mixer->get_audio_mixer()->set_compressor_enabled(state == Qt::Checked);
         });
         connect(ui->reset_meters_button, &QPushButton::clicked, this, &MainWindow::reset_meters_button_clicked);
-       mixer->set_audio_level_callback(bind(&MainWindow::audio_level_callback, this, _1, _2, _3, _4, _5, _6, _7, _8));
+       mixer->get_audio_mixer()->set_audio_level_callback(bind(&MainWindow::audio_level_callback, this, _1, _2, _3, _4, _5, _6, _7, _8));
  
         struct sigaction act;
         memset(&act, 0, sizeof(act));
@@ -391,7 +391,7 @@ void MainWindow::mini_fader_changed(Ui::AudioMiniView *ui, int channel, int valu
  
  void MainWindow::reset_meters_button_clicked()
  {
-       global_mixer->reset_meters();
+       global_mixer->get_audio_mixer()->reset_meters();
         ui->peak_display->setText(QString::fromStdString(format_db(-HUGE_VAL, DB_WITH_SIGN | DB_BARE)));
         ui->peak_display->setStyleSheet("");
  }
diff --git a/mixer.cpp b/mixer.cpp

index 38578f90ea7b85609531a63d5bc1bc3806a983b7..00f161a1052bcc7077951459282024be2999c5ba 100644 (file)
--- a/mixer.cpp
+++ b/mixer.cpp
@@ -105,8 +105,7 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
           num_cards(num_cards),
           mixer_surface(create_surface(format)),
           h264_encoder_surface(create_surface(format)),
-         audio_mixer(num_cards),
-         correlation(OUTPUT_FREQUENCY)
+         audio_mixer(num_cards)
  {
         CHECK(init_movit(MOVIT_SHADER_DIR, MOVIT_DEBUG_OFF));
         check_error();
@@ -232,13 +231,6 @@ Mixer::Mixer(const QSurfaceFormat &format, unsigned num_cards)
         cbcr_position_attribute_index = glGetAttribLocation(cbcr_program_num, "position");
         cbcr_texcoord_attribute_index = glGetAttribLocation(cbcr_program_num, "texcoord");
  
-       r128.init(2, OUTPUT_FREQUENCY);
-       r128.integr_start();
-
-       // hlen=16 is pretty low quality, but we use quite a bit of CPU otherwise,
-       // and there's a limit to how important the peak meter is.
-       peak_resampler.setup(OUTPUT_FREQUENCY, OUTPUT_FREQUENCY * 4, /*num_channels=*/2, /*hlen=*/16, /*frel=*/1.0);
-
         if (global_flags.enable_alsa_output) {
                 alsa.reset(new ALSAOutput(OUTPUT_FREQUENCY, /*num_channels=*/2));
         }
@@ -304,30 +296,6 @@ int unwrap_timecode(uint16_t current_wrapped, int last)
         }
  }
  
-float find_peak(const float *samples, size_t num_samples)
-{
-       float m = fabs(samples[0]);
-       for (size_t i = 1; i < num_samples; ++i) {
-               m = max(m, fabs(samples[i]));
-       }
-       return m;
-}
-
-void deinterleave_samples(const vector<float> &in, vector<float> *out_l, vector<float> *out_r)
-{
-       size_t num_samples = in.size() / 2;
-       out_l->resize(num_samples);
-       out_r->resize(num_samples);
-
-       const float *inptr = in.data();
-       float *lptr = &(*out_l)[0];
-       float *rptr = &(*out_r)[0];
-       for (size_t i = 0; i < num_samples; ++i) {
-               *lptr++ = *inptr++;
-               *rptr++ = *inptr++;
-       }
-}
-
  }  // namespace
  
  void Mixer::bm_frame(unsigned card_index, uint16_t timecode,
@@ -582,7 +550,6 @@ void Mixer::thread_func()
                 get_one_frame_from_each_card(master_card_index, new_frames, has_new_frame, num_samples);
                 schedule_audio_resampling_tasks(new_frames[master_card_index].dropped_frames, num_samples[master_card_index], new_frames[master_card_index].length);
                 stats_dropped_frames += new_frames[master_card_index].dropped_frames;
-               send_audio_level_callback();
  
                 handle_hotplugged_cards();
  
@@ -872,25 +839,6 @@ void Mixer::render_one_frame(int64_t duration)
         }
  }
  
-void Mixer::send_audio_level_callback()
-{
-       if (audio_level_callback == nullptr) {
-               return;
-       }
-
-       unique_lock<mutex> lock(audio_measure_mutex);
-       double loudness_s = r128.loudness_S();
-       double loudness_i = r128.integrated();
-       double loudness_range_low = r128.range_min();
-       double loudness_range_high = r128.range_max();
-
-       audio_level_callback(loudness_s, to_db(peak),
-               loudness_i, loudness_range_low, loudness_range_high,
-               audio_mixer.get_gain_staging_db(),
-               audio_mixer.get_final_makeup_gain_db(),
-               correlation.get_correlation());
-}
-
  void Mixer::audio_thread_func()
  {
         while (!should_quit) {
@@ -908,51 +856,14 @@ void Mixer::audio_thread_func()
  
                 ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy =
                         task.adjust_rate ? ResamplingQueue::ADJUST_RATE : ResamplingQueue::DO_NOT_ADJUST_RATE;
-               process_audio_one_frame(task.pts_int, task.num_samples, rate_adjustment_policy);
-       }
-}
-
-void Mixer::process_audio_one_frame(int64_t frame_pts_int, int num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy)
-{
-       vector<float> samples_out = audio_mixer.get_output(double(frame_pts_int) / TIMEBASE, num_samples, rate_adjustment_policy);
+               vector<float> samples_out = audio_mixer.get_output(double(task.pts_int) / TIMEBASE, task.num_samples, rate_adjustment_policy);
  
-       // Upsample 4x to find interpolated peak.
-       peak_resampler.inp_data = samples_out.data();
-       peak_resampler.inp_count = samples_out.size() / 2;
-
-       vector<float> interpolated_samples_out;
-       interpolated_samples_out.resize(samples_out.size());
-       {
-               unique_lock<mutex> lock(audio_measure_mutex);
-
-               while (peak_resampler.inp_count > 0) {  // About four iterations.
-                       peak_resampler.out_data = &interpolated_samples_out[0];
-                       peak_resampler.out_count = interpolated_samples_out.size() / 2;
-                       peak_resampler.process();
-                       size_t out_stereo_samples = interpolated_samples_out.size() / 2 - peak_resampler.out_count;
-                       peak = max<float>(peak, find_peak(interpolated_samples_out.data(), out_stereo_samples * 2));
-                       peak_resampler.out_data = nullptr;
+               // Send the samples to the sound card, then add them to the output.
+               if (alsa) {
+                       alsa->write(samples_out);
                 }
+               video_encoder->add_audio(task.pts_int, move(samples_out));
         }
-
-       // Find R128 levels and L/R correlation.
-       vector<float> left, right;
-       deinterleave_samples(samples_out, &left, &right);
-       float *ptrs[] = { left.data(), right.data() };
-       {
-               unique_lock<mutex> lock(audio_measure_mutex);
-               r128.process(left.size(), ptrs);
-               audio_mixer.set_current_loudness(r128.loudness_M());
-               correlation.process_samples(samples_out);
-       }
-
-       // Send the samples to the sound card.
-       if (alsa) {
-               alsa->write(samples_out);
-       }
-
-       // And finally add them to the output.
-       video_encoder->add_audio(frame_pts_int, move(samples_out));
  }
  
  void Mixer::subsample_chroma(GLuint src_tex, GLuint dst_tex)
@@ -1048,16 +959,6 @@ void Mixer::channel_clicked(int preview_num)
         theme->channel_clicked(preview_num);
  }
  
-void Mixer::reset_meters()
-{
-       unique_lock<mutex> lock(audio_measure_mutex);
-       peak_resampler.reset();
-       peak = 0.0f;
-       r128.reset();
-       r128.integr_start();
-       correlation.reset();
-}
-
  void Mixer::start_mode_scanning(unsigned card_index)
  {
         assert(card_index < num_cards);
diff --git a/mixer.h b/mixer.h

index 354735da57d9e7a6880a18a6bab5f7cc3350ccbb..5c69edd4450ac4922b30ac05b52a6413c6fe2084 100644 (file)
--- a/mixer.h
+++ b/mixer.h
@@ -11,7 +11,6 @@
  #include <movit/flat_input.h>
  #include <stdbool.h>
  #include <stdint.h>
-#include <zita-resampler/resampler.h>
  
  #include <atomic>
  #include <chrono>
@@ -29,9 +28,7 @@
  #include "alsa_output.h"
  #include "audio_mixer.h"
  #include "bmusb/bmusb.h"
-#include "correlation_measurer.h"
  #include "defs.h"
-#include "ebu_r128_proc.h"
  #include "httpd.h"
  #include "input_state.h"
  #include "pbo_frame_allocator.h"
@@ -172,15 +169,6 @@ public:
                 output_channel[output].set_color_updated_callback(callback);
         }
  
-       typedef std::function<void(float level_lufs, float peak_db,
-                                  float global_level_lufs, float range_low_lufs, float range_high_lufs,
-                                  float gain_staging_db, float final_makeup_gain_db,
-                                  float correlation)> audio_level_callback_t;
-       void set_audio_level_callback(audio_level_callback_t callback)
-       {
-               audio_level_callback = callback;
-       }
-
         std::vector<std::string> get_transition_names()
         {
                 return theme->get_transition_names(pts());
@@ -254,8 +242,6 @@ public:
                 should_cut = true;
         }
  
-       void reset_meters();
-
         unsigned get_num_cards() const { return num_cards; }
  
         std::string get_card_description(unsigned card_index) const {
@@ -326,9 +312,7 @@ private:
         void handle_hotplugged_cards();
         void schedule_audio_resampling_tasks(unsigned dropped_frames, int num_samples_per_frame, int length_per_frame);
         void render_one_frame(int64_t duration);
-       void send_audio_level_callback();
         void audio_thread_func();
-       void process_audio_one_frame(int64_t frame_pts_int, int num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy);
         void subsample_chroma(GLuint src_tex, GLuint dst_dst);
         void release_display_frame(DisplayFrame *frame);
         double pts() { return double(pts_int) / TIMEBASE; }
@@ -426,13 +410,6 @@ private:
         std::atomic<bool> should_quit{false};
         std::atomic<bool> should_cut{false};
  
-       audio_level_callback_t audio_level_callback = nullptr;
-       mutable std::mutex audio_measure_mutex;
-       Ebu_r128_proc r128;  // Under audio_measure_mutex.
-       CorrelationMeasurer correlation;  // Under audio_measure_mutex.
-       Resampler peak_resampler;  // Under audio_measure_mutex.
-       std::atomic<float> peak{0.0f};
-
         std::unique_ptr<ALSAOutput> alsa;
  
         struct AudioTask {
author	Steinar H. Gunderson <sgunderson@bigfoot.com>
	Sat, 13 Aug 2016 17:22:07 +0000 (19:22 +0200)
committer	Steinar H. Gunderson <sgunderson@bigfoot.com>
	Wed, 19 Oct 2016 22:55:44 +0000 (00:55 +0200)
audio_mixer.cpp		patch \| blob \| history
audio_mixer.h		patch \| blob \| history
mainwindow.cpp		patch \| blob \| history
mixer.cpp		patch \| blob \| history
mixer.h		patch \| blob \| history