]> git.sesse.net Git - nageru/blob - audio_mixer.h
Fix an issue where the mixer lagging too much behind CEF would cause us to display...
[nageru] / audio_mixer.h
1 #ifndef _AUDIO_MIXER_H
2 #define _AUDIO_MIXER_H 1
3
4 // The audio mixer, dealing with extracting the right signals from
5 // each capture card, resampling signals so that they are in sync,
6 // processing them with effects (if desired), and then mixing them
7 // all together into one final audio signal.
8 //
9 // All operations on AudioMixer (except destruction) are thread-safe.
10
11 #include <assert.h>
12 #include <stdint.h>
13 #include <zita-resampler/resampler.h>
14 #include <atomic>
15 #include <chrono>
16 #include <functional>
17 #include <map>
18 #include <memory>
19 #include <mutex>
20 #include <set>
21 #include <string>
22 #include <vector>
23
24 #include "alsa_pool.h"
25 #include "correlation_measurer.h"
26 #include "db.h"
27 #include "defs.h"
28 #include "ebu_r128_proc.h"
29 #include "filter.h"
30 #include "input_mapping.h"
31 #include "resampling_queue.h"
32 #include "stereocompressor.h"
33
34 class DeviceSpecProto;
35
36 namespace bmusb {
37 struct AudioFormat;
38 }  // namespace bmusb
39
40 enum EQBand {
41         EQ_BAND_BASS = 0,
42         EQ_BAND_MID,
43         EQ_BAND_TREBLE,
44         NUM_EQ_BANDS
45 };
46
47 class AudioMixer {
48 public:
49         AudioMixer(unsigned num_cards);
50         void reset_resampler(DeviceSpec device_spec);
51         void reset_meters();
52
53         // Add audio (or silence) to the given device's queue. Can return false if
54         // the lock wasn't successfully taken; if so, you should simply try again.
55         // (This is to avoid a deadlock where a card hangs on the mutex in add_audio()
56         // while we are trying to shut it down from another thread that also holds
57         // the mutex.) frame_length is in TIMEBASE units.
58         bool add_audio(DeviceSpec device_spec, const uint8_t *data, unsigned num_samples, bmusb::AudioFormat audio_format, int64_t frame_length, std::chrono::steady_clock::time_point frame_time);
59         bool add_silence(DeviceSpec device_spec, unsigned samples_per_frame, unsigned num_frames, int64_t frame_length);
60
61         // If a given device is offline for whatever reason and cannot deliver audio
62         // (by means of add_audio() or add_silence()), you can call put it in silence mode,
63         // where it will be taken to only output silence. Note that when taking it _out_
64         // of silence mode, the resampler will be reset, so that old audio will not
65         // affect it. Same true/false behavior as add_audio().
66         bool silence_card(DeviceSpec device_spec, bool silence);
67
68         std::vector<float> get_output(std::chrono::steady_clock::time_point ts, unsigned num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy);
69
70         float get_fader_volume(unsigned bus_index) const { return fader_volume_db[bus_index]; }
71         void set_fader_volume(unsigned bus_index, float level_db) { fader_volume_db[bus_index] = level_db; }
72
73         bool get_mute(unsigned bus_index) const { return mute[bus_index]; }
74         void set_mute(unsigned bus_index, bool muted) { mute[bus_index] = muted; }
75
76         // Note: This operation holds all ALSA devices (see ALSAPool::get_devices()).
77         // You will need to call set_input_mapping() to get the hold state correctly,
78         // or every card will be held forever.
79         std::map<DeviceSpec, DeviceInfo> get_devices();
80
81         // See comments on ALSAPool::get_card_state().
82         ALSAPool::Device::State get_alsa_card_state(unsigned index)
83         {
84                 return alsa_pool.get_card_state(index);
85         }
86
87         // See comments on ALSAPool::create_dead_card().
88         DeviceSpec create_dead_card(const std::string &name, const std::string &info, unsigned num_channels)
89         {
90                 unsigned dead_card_index = alsa_pool.create_dead_card(name, info, num_channels);
91                 return DeviceSpec{InputSourceType::ALSA_INPUT, dead_card_index};
92         }
93
94         void set_display_name(DeviceSpec device_spec, const std::string &name);
95
96         // Note: The card should be held (currently this isn't enforced, though).
97         void serialize_device(DeviceSpec device_spec, DeviceSpecProto *device_spec_proto);
98
99         enum class MappingMode {
100                 // A single bus, only from a video card (no ALSA devices),
101                 // only channel 1 and 2, locked to +0 dB. Note that this is
102                 // only an UI abstraction around exactly the same audio code
103                 // as MULTICHANNEL; it's just less flexible.
104                 SIMPLE,
105
106                 // Full, arbitrary mappings.
107                 MULTICHANNEL
108         };
109
110         // Automatically sets mapping mode to MappingMode::SIMPLE.
111         void set_simple_input(unsigned card_index);
112
113         // If mapping mode is not representable as a MappingMode::SIMPLE type
114         // mapping, returns numeric_limits<unsigned>::max().
115         unsigned get_simple_input() const;
116
117         // Implicitly sets mapping mode to MappingMode::MULTICHANNEL.
118         void set_input_mapping(const InputMapping &input_mapping);
119
120         MappingMode get_mapping_mode() const;
121         InputMapping get_input_mapping() const;
122
123         unsigned num_buses() const;
124
125         void set_locut_cutoff(float cutoff_hz)
126         {
127                 locut_cutoff_hz = cutoff_hz;
128         }
129
130         float get_locut_cutoff() const
131         {
132                 return locut_cutoff_hz;
133         }
134
135         void set_locut_enabled(unsigned bus, bool enabled)
136         {
137                 locut_enabled[bus] = enabled;
138         }
139
140         bool get_locut_enabled(unsigned bus)
141         {
142                 return locut_enabled[bus];
143         }
144
145         void set_eq(unsigned bus_index, EQBand band, float db_gain)
146         {
147                 assert(band >= 0 && band < NUM_EQ_BANDS);
148                 eq_level_db[bus_index][band] = db_gain;
149         }
150
151         float get_eq(unsigned bus_index, EQBand band) const
152         {
153                 assert(band >= 0 && band < NUM_EQ_BANDS);
154                 return eq_level_db[bus_index][band];
155         }
156
157         float get_limiter_threshold_dbfs() const
158         {
159                 return limiter_threshold_dbfs;
160         }
161
162         float get_compressor_threshold_dbfs(unsigned bus_index) const
163         {
164                 return compressor_threshold_dbfs[bus_index];
165         }
166
167         void set_limiter_threshold_dbfs(float threshold_dbfs)
168         {
169                 limiter_threshold_dbfs = threshold_dbfs;
170         }
171
172         void set_compressor_threshold_dbfs(unsigned bus_index, float threshold_dbfs)
173         {
174                 compressor_threshold_dbfs[bus_index] = threshold_dbfs;
175         }
176
177         void set_limiter_enabled(bool enabled)
178         {
179                 limiter_enabled = enabled;
180         }
181
182         bool get_limiter_enabled() const
183         {
184                 return limiter_enabled;
185         }
186
187         void set_compressor_enabled(unsigned bus_index, bool enabled)
188         {
189                 compressor_enabled[bus_index] = enabled;
190         }
191
192         bool get_compressor_enabled(unsigned bus_index) const
193         {
194                 return compressor_enabled[bus_index];
195         }
196
197         void set_gain_staging_db(unsigned bus_index, float gain_db)
198         {
199                 std::unique_lock<std::mutex> lock(compressor_mutex);
200                 level_compressor_enabled[bus_index] = false;
201                 gain_staging_db[bus_index] = gain_db;
202         }
203
204         float get_gain_staging_db(unsigned bus_index) const
205         {
206                 std::unique_lock<std::mutex> lock(compressor_mutex);
207                 return gain_staging_db[bus_index];
208         }
209
210         void set_gain_staging_auto(unsigned bus_index, bool enabled)
211         {
212                 std::unique_lock<std::mutex> lock(compressor_mutex);
213                 level_compressor_enabled[bus_index] = enabled;
214         }
215
216         bool get_gain_staging_auto(unsigned bus_index) const
217         {
218                 std::unique_lock<std::mutex> lock(compressor_mutex);
219                 return level_compressor_enabled[bus_index];
220         }
221
222         void set_final_makeup_gain_db(float gain_db)
223         {
224                 std::unique_lock<std::mutex> lock(compressor_mutex);
225                 final_makeup_gain_auto = false;
226                 final_makeup_gain = from_db(gain_db);
227         }
228
229         float get_final_makeup_gain_db()
230         {
231                 std::unique_lock<std::mutex> lock(compressor_mutex);
232                 return to_db(final_makeup_gain);
233         }
234
235         void set_final_makeup_gain_auto(bool enabled)
236         {
237                 std::unique_lock<std::mutex> lock(compressor_mutex);
238                 final_makeup_gain_auto = enabled;
239         }
240
241         bool get_final_makeup_gain_auto() const
242         {
243                 std::unique_lock<std::mutex> lock(compressor_mutex);
244                 return final_makeup_gain_auto;
245         }
246
247         void reset_peak(unsigned bus_index);
248
249         struct BusLevel {
250                 float current_level_dbfs[2];  // Digital peak of last frame, left and right.
251                 float peak_level_dbfs[2];  // Digital peak with hold, left and right.
252                 float historic_peak_dbfs;
253                 float gain_staging_db;
254                 float compressor_attenuation_db;  // A positive number; 0.0 for no attenuation.
255         };
256
257         typedef std::function<void(float level_lufs, float peak_db,
258                                    std::vector<BusLevel> bus_levels,
259                                    float global_level_lufs, float range_low_lufs, float range_high_lufs,
260                                    float final_makeup_gain_db,
261                                    float correlation)> audio_level_callback_t;
262         void set_audio_level_callback(audio_level_callback_t callback)
263         {
264                 audio_level_callback = callback;
265         }
266
267         typedef std::function<void()> state_changed_callback_t;
268         void set_state_changed_callback(state_changed_callback_t callback)
269         {
270                 state_changed_callback = callback;
271         }
272
273         state_changed_callback_t get_state_changed_callback() const
274         {
275                 return state_changed_callback;
276         }
277
278         void trigger_state_changed_callback()
279         {
280                 if (state_changed_callback != nullptr) {
281                         state_changed_callback();
282                 }
283         }
284
285         // A combination of all settings for a bus. Useful if you want to get
286         // or store them as a whole without bothering to call all of the get_*
287         // or set_* functions for that bus.
288         struct BusSettings {
289                 float fader_volume_db;
290                 bool muted;
291                 bool locut_enabled;
292                 float eq_level_db[NUM_EQ_BANDS];
293                 float gain_staging_db;
294                 bool level_compressor_enabled;
295                 float compressor_threshold_dbfs;
296                 bool compressor_enabled;
297         };
298         static BusSettings get_default_bus_settings();
299         BusSettings get_bus_settings(unsigned bus_index) const;
300         void set_bus_settings(unsigned bus_index, const BusSettings &settings);
301
302 private:
303         struct AudioDevice {
304                 std::unique_ptr<ResamplingQueue> resampling_queue;
305                 std::string display_name;
306                 unsigned capture_frequency = OUTPUT_FREQUENCY;
307                 // Which channels we consider interesting (ie., are part of some input_mapping).
308                 std::set<unsigned> interesting_channels;
309                 bool silenced = false;
310         };
311
312         const AudioDevice *find_audio_device(DeviceSpec device_spec) const
313         {
314                 return const_cast<AudioMixer *>(this)->find_audio_device(device_spec);
315         }
316
317         AudioDevice *find_audio_device(DeviceSpec device_spec);
318
319         void find_sample_src_from_device(const std::map<DeviceSpec, std::vector<float>> &samples_card, DeviceSpec device_spec, int source_channel, const float **srcptr, unsigned *stride);
320         void fill_audio_bus(const std::map<DeviceSpec, std::vector<float>> &samples_card, const InputMapping::Bus &bus, unsigned num_samples, float *output);
321         void reset_resampler_mutex_held(DeviceSpec device_spec);
322         void apply_eq(unsigned bus_index, std::vector<float> *samples_bus);
323         void update_meters(const std::vector<float> &samples);
324         void add_bus_to_master(unsigned bus_index, const std::vector<float> &samples_bus, std::vector<float> *samples_out);
325         void measure_bus_levels(unsigned bus_index, const std::vector<float> &left, const std::vector<float> &right);
326         void send_audio_level_callback();
327         std::vector<DeviceSpec> get_active_devices() const;
328         void set_input_mapping_lock_held(const InputMapping &input_mapping);
329
330         unsigned num_cards;
331
332         mutable std::timed_mutex audio_mutex;
333
334         ALSAPool alsa_pool;
335         AudioDevice video_cards[MAX_VIDEO_CARDS];  // Under audio_mutex.
336         AudioDevice alsa_inputs[MAX_ALSA_CARDS];  // Under audio_mutex.
337
338         std::atomic<float> locut_cutoff_hz{120};
339         StereoFilter locut[MAX_BUSES];  // Default cutoff 120 Hz, 24 dB/oct.
340         std::atomic<bool> locut_enabled[MAX_BUSES];
341         StereoFilter eq[MAX_BUSES][NUM_EQ_BANDS];  // The one for EQBand::MID isn't actually used (see comments in apply_eq()).
342
343         // First compressor; takes us up to about -12 dBFS.
344         mutable std::mutex compressor_mutex;
345         std::unique_ptr<StereoCompressor> level_compressor[MAX_BUSES];  // Under compressor_mutex. Used to set/override gain_staging_db if <level_compressor_enabled>.
346         float gain_staging_db[MAX_BUSES];  // Under compressor_mutex.
347         float last_gain_staging_db[MAX_BUSES];  // Under compressor_mutex.
348         bool level_compressor_enabled[MAX_BUSES];  // Under compressor_mutex.
349
350         static constexpr float ref_level_dbfs = -14.0f;  // Chosen so that we end up around 0 LU in practice.
351         static constexpr float ref_level_lufs = -23.0f;  // 0 LU, more or less by definition.
352
353         StereoCompressor limiter;
354         std::atomic<float> limiter_threshold_dbfs{ref_level_dbfs + 4.0f};   // 4 dB.
355         std::atomic<bool> limiter_enabled{true};
356         std::unique_ptr<StereoCompressor> compressor[MAX_BUSES];
357         std::atomic<float> compressor_threshold_dbfs[MAX_BUSES];
358         std::atomic<bool> compressor_enabled[MAX_BUSES];
359
360         // Note: The values here are not in dB.
361         struct PeakHistory {
362                 float current_level = 0.0f;  // Peak of the last frame.
363                 float historic_peak = 0.0f;  // Highest peak since last reset; no falloff.
364                 float current_peak = 0.0f;  // Current peak of the peak meter.
365                 float last_peak = 0.0f;
366                 float age_seconds = 0.0f;   // Time since "last_peak" was set.
367         };
368         PeakHistory peak_history[MAX_BUSES][2];  // Separate for each channel. Under audio_mutex.
369
370         double final_makeup_gain = 1.0;  // Under compressor_mutex. Read/write by the user. Note: Not in dB, we want the numeric precision so that we can change it slowly.
371         bool final_makeup_gain_auto = true;  // Under compressor_mutex.
372
373         MappingMode current_mapping_mode;  // Under audio_mutex.
374         InputMapping input_mapping;  // Under audio_mutex.
375         std::atomic<float> fader_volume_db[MAX_BUSES] {{ 0.0f }};
376         std::atomic<bool> mute[MAX_BUSES] {{ false }};
377         float last_fader_volume_db[MAX_BUSES] { 0.0f };  // Under audio_mutex.
378         std::atomic<float> eq_level_db[MAX_BUSES][NUM_EQ_BANDS] {{{ 0.0f }}};
379         float last_eq_level_db[MAX_BUSES][NUM_EQ_BANDS] {{ 0.0f }};
380
381         audio_level_callback_t audio_level_callback = nullptr;
382         state_changed_callback_t state_changed_callback = nullptr;
383         mutable std::mutex audio_measure_mutex;
384         Ebu_r128_proc r128;  // Under audio_measure_mutex.
385         CorrelationMeasurer correlation;  // Under audio_measure_mutex.
386         Resampler peak_resampler;  // Under audio_measure_mutex.
387         std::atomic<float> peak{0.0f};
388
389         // Metrics.
390         std::atomic<double> metric_audio_loudness_short_lufs{0.0 / 0.0};
391         std::atomic<double> metric_audio_loudness_integrated_lufs{0.0 / 0.0};
392         std::atomic<double> metric_audio_loudness_range_low_lufs{0.0 / 0.0};
393         std::atomic<double> metric_audio_loudness_range_high_lufs{0.0 / 0.0};
394         std::atomic<double> metric_audio_peak_dbfs{0.0 / 0.0};
395         std::atomic<double> metric_audio_final_makeup_gain_db{0.0};
396         std::atomic<double> metric_audio_correlation{0.0};
397
398         // These are all gauges corresponding to the elements of BusLevel.
399         // In a sense, they'd probably do better as histograms, but that's an
400         // awful lot of time series when you have many buses.
401         struct BusMetrics {
402                 std::vector<std::pair<std::string, std::string>> labels;
403                 std::atomic<double> current_level_dbfs[2]{{0.0/0.0},{0.0/0.0}};
404                 std::atomic<double> peak_level_dbfs[2]{{0.0/0.0},{0.0/0.0}};
405                 std::atomic<double> historic_peak_dbfs{0.0/0.0};
406                 std::atomic<double> gain_staging_db{0.0/0.0};
407                 std::atomic<double> compressor_attenuation_db{0.0/0.0};
408         };
409         std::unique_ptr<BusMetrics[]> bus_metrics;  // One for each bus in <input_mapping>.
410 };
411
412 extern AudioMixer *global_audio_mixer;
413
414 #endif  // !defined(_AUDIO_MIXER_H)