]> git.sesse.net Git - nageru/blob - audio_mixer.h
Do not use the timing of dropped frames as part of the video master clock.
[nageru] / audio_mixer.h
1 #ifndef _AUDIO_MIXER_H
2 #define _AUDIO_MIXER_H 1
3
4 // The audio mixer, dealing with extracting the right signals from
5 // each capture card, resampling signals so that they are in sync,
6 // processing them with effects (if desired), and then mixing them
7 // all together into one final audio signal.
8 //
9 // All operations on AudioMixer (except destruction) are thread-safe.
10
11 #include <math.h>
12 #include <stdint.h>
13 #include <atomic>
14 #include <map>
15 #include <memory>
16 #include <mutex>
17 #include <set>
18 #include <vector>
19 #include <zita-resampler/resampler.h>
20
21 #include "alsa_input.h"
22 #include "alsa_pool.h"
23 #include "bmusb/bmusb.h"
24 #include "correlation_measurer.h"
25 #include "db.h"
26 #include "defs.h"
27 #include "ebu_r128_proc.h"
28 #include "filter.h"
29 #include "input_mapping.h"
30 #include "resampling_queue.h"
31 #include "stereocompressor.h"
32
33 namespace bmusb {
34 struct AudioFormat;
35 }  // namespace bmusb
36
37 enum EQBand {
38         EQ_BAND_BASS = 0,
39         EQ_BAND_MID,
40         EQ_BAND_TREBLE,
41         NUM_EQ_BANDS
42 };
43
44 class AudioMixer {
45 public:
46         AudioMixer(unsigned num_cards);
47         void reset_resampler(DeviceSpec device_spec);
48         void reset_meters();
49
50         // Add audio (or silence) to the given device's queue. Can return false if
51         // the lock wasn't successfully taken; if so, you should simply try again.
52         // (This is to avoid a deadlock where a card hangs on the mutex in add_audio()
53         // while we are trying to shut it down from another thread that also holds
54         // the mutex.) frame_length is in TIMEBASE units.
55         bool add_audio(DeviceSpec device_spec, const uint8_t *data, unsigned num_samples, bmusb::AudioFormat audio_format, int64_t frame_length);
56         bool add_silence(DeviceSpec device_spec, unsigned samples_per_frame, unsigned num_frames, int64_t frame_length);
57
58         // If a given device is offline for whatever reason and cannot deliver audio
59         // (by means of add_audio() or add_silence()), you can call put it in silence mode,
60         // where it will be taken to only output silence. Note that when taking it _out_
61         // of silence mode, the resampler will be reset, so that old audio will not
62         // affect it. Same true/false behavior as add_audio().
63         bool silence_card(DeviceSpec device_spec, bool silence);
64
65         std::vector<float> get_output(double pts, unsigned num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy);
66
67         float get_fader_volume(unsigned bus_index) const { return fader_volume_db[bus_index]; }
68         void set_fader_volume(unsigned bus_index, float level_db) { fader_volume_db[bus_index] = level_db; }
69
70         // Note: This operation holds all ALSA devices (see ALSAPool::get_devices()).
71         // You will need to call set_input_mapping() to get the hold state correctly,
72         // or every card will be held forever.
73         std::map<DeviceSpec, DeviceInfo> get_devices();
74
75         // See comments on ALSAPool::get_card_state().
76         ALSAPool::Device::State get_alsa_card_state(unsigned index)
77         {
78                 return alsa_pool.get_card_state(index);
79         }
80
81         // See comments on ALSAPool::create_dead_card().
82         DeviceSpec create_dead_card(const std::string &name, const std::string &info, unsigned num_channels)
83         {
84                 unsigned dead_card_index = alsa_pool.create_dead_card(name, info, num_channels);
85                 return DeviceSpec{InputSourceType::ALSA_INPUT, dead_card_index};
86         }
87
88         void set_display_name(DeviceSpec device_spec, const std::string &name);
89
90         // Note: The card should be held (currently this isn't enforced, though).
91         void serialize_device(DeviceSpec device_spec, DeviceSpecProto *device_spec_proto);
92
93         void set_input_mapping(const InputMapping &input_mapping);
94         InputMapping get_input_mapping() const;
95
96         void set_locut_cutoff(float cutoff_hz)
97         {
98                 locut_cutoff_hz = cutoff_hz;
99         }
100
101         float get_locut_cutoff() const
102         {
103                 return locut_cutoff_hz;
104         }
105
106         void set_locut_enabled(unsigned bus, bool enabled)
107         {
108                 locut_enabled[bus] = enabled;
109         }
110
111         bool get_locut_enabled(unsigned bus)
112         {
113                 return locut_enabled[bus];
114         }
115
116         void set_eq(unsigned bus_index, EQBand band, float db_gain)
117         {
118                 assert(band >= 0 && band < NUM_EQ_BANDS);
119                 eq_level_db[bus_index][band] = db_gain;
120         }
121
122         float get_eq(unsigned bus_index, EQBand band) const
123         {
124                 assert(band >= 0 && band < NUM_EQ_BANDS);
125                 return eq_level_db[bus_index][band];
126         }
127
128         float get_limiter_threshold_dbfs() const
129         {
130                 return limiter_threshold_dbfs;
131         }
132
133         float get_compressor_threshold_dbfs(unsigned bus_index) const
134         {
135                 return compressor_threshold_dbfs[bus_index];
136         }
137
138         void set_limiter_threshold_dbfs(float threshold_dbfs)
139         {
140                 limiter_threshold_dbfs = threshold_dbfs;
141         }
142
143         void set_compressor_threshold_dbfs(unsigned bus_index, float threshold_dbfs)
144         {
145                 compressor_threshold_dbfs[bus_index] = threshold_dbfs;
146         }
147
148         void set_limiter_enabled(bool enabled)
149         {
150                 limiter_enabled = enabled;
151         }
152
153         bool get_limiter_enabled() const
154         {
155                 return limiter_enabled;
156         }
157
158         void set_compressor_enabled(unsigned bus_index, bool enabled)
159         {
160                 compressor_enabled[bus_index] = enabled;
161         }
162
163         bool get_compressor_enabled(unsigned bus_index) const
164         {
165                 return compressor_enabled[bus_index];
166         }
167
168         void set_gain_staging_db(unsigned bus_index, float gain_db)
169         {
170                 std::unique_lock<std::mutex> lock(compressor_mutex);
171                 level_compressor_enabled[bus_index] = false;
172                 gain_staging_db[bus_index] = gain_db;
173         }
174
175         float get_gain_staging_db(unsigned bus_index) const
176         {
177                 std::unique_lock<std::mutex> lock(compressor_mutex);
178                 return gain_staging_db[bus_index];
179         }
180
181         void set_gain_staging_auto(unsigned bus_index, bool enabled)
182         {
183                 std::unique_lock<std::mutex> lock(compressor_mutex);
184                 level_compressor_enabled[bus_index] = enabled;
185         }
186
187         bool get_gain_staging_auto(unsigned bus_index) const
188         {
189                 std::unique_lock<std::mutex> lock(compressor_mutex);
190                 return level_compressor_enabled[bus_index];
191         }
192
193         void set_final_makeup_gain_db(float gain_db)
194         {
195                 std::unique_lock<std::mutex> lock(compressor_mutex);
196                 final_makeup_gain_auto = false;
197                 final_makeup_gain = from_db(gain_db);
198         }
199
200         float get_final_makeup_gain_db()
201         {
202                 std::unique_lock<std::mutex> lock(compressor_mutex);
203                 return to_db(final_makeup_gain);
204         }
205
206         void set_final_makeup_gain_auto(bool enabled)
207         {
208                 std::unique_lock<std::mutex> lock(compressor_mutex);
209                 final_makeup_gain_auto = enabled;
210         }
211
212         bool get_final_makeup_gain_auto() const
213         {
214                 std::unique_lock<std::mutex> lock(compressor_mutex);
215                 return final_makeup_gain_auto;
216         }
217
218         void reset_peak(unsigned bus_index);
219
220         struct BusLevel {
221                 float current_level_dbfs[2];  // Digital peak of last frame, left and right.
222                 float peak_level_dbfs[2];  // Digital peak with hold, left and right.
223                 float historic_peak_dbfs;
224                 float gain_staging_db;
225                 float compressor_attenuation_db;  // A positive number; 0.0 for no attenuation.
226         };
227
228         typedef std::function<void(float level_lufs, float peak_db,
229                                    std::vector<BusLevel> bus_levels,
230                                    float global_level_lufs, float range_low_lufs, float range_high_lufs,
231                                    float final_makeup_gain_db,
232                                    float correlation)> audio_level_callback_t;
233         void set_audio_level_callback(audio_level_callback_t callback)
234         {
235                 audio_level_callback = callback;
236         }
237
238         typedef std::function<void()> state_changed_callback_t;
239         void set_state_changed_callback(state_changed_callback_t callback)
240         {
241                 state_changed_callback = callback;
242         }
243
244         state_changed_callback_t get_state_changed_callback() const
245         {
246                 return state_changed_callback;
247         }
248
249         void trigger_state_changed_callback()
250         {
251                 if (state_changed_callback != nullptr) {
252                         state_changed_callback();
253                 }
254         }
255
256         // A combination of all settings for a bus. Useful if you want to get
257         // or store them as a whole without bothering to call all of the get_*
258         // or set_* functions for that bus.
259         struct BusSettings {
260                 float fader_volume_db;
261                 bool locut_enabled;
262                 float eq_level_db[NUM_EQ_BANDS];
263                 float gain_staging_db;
264                 bool level_compressor_enabled;
265                 float compressor_threshold_dbfs;
266                 bool compressor_enabled;
267         };
268         static BusSettings get_default_bus_settings();
269         BusSettings get_bus_settings(unsigned bus_index) const;
270         void set_bus_settings(unsigned bus_index, const BusSettings &settings);
271
272 private:
273         struct AudioDevice {
274                 std::unique_ptr<ResamplingQueue> resampling_queue;
275                 int64_t next_local_pts = 0;
276                 std::string display_name;
277                 unsigned capture_frequency = OUTPUT_FREQUENCY;
278                 // Which channels we consider interesting (ie., are part of some input_mapping).
279                 std::set<unsigned> interesting_channels;
280                 bool silenced = false;
281         };
282
283         const AudioDevice *find_audio_device(DeviceSpec device_spec) const
284         {
285                 return const_cast<AudioMixer *>(this)->find_audio_device(device_spec);
286         }
287
288         AudioDevice *find_audio_device(DeviceSpec device_spec);
289
290         void find_sample_src_from_device(const std::map<DeviceSpec, std::vector<float>> &samples_card, DeviceSpec device_spec, int source_channel, const float **srcptr, unsigned *stride);
291         void fill_audio_bus(const std::map<DeviceSpec, std::vector<float>> &samples_card, const InputMapping::Bus &bus, unsigned num_samples, float *output);
292         void reset_resampler_mutex_held(DeviceSpec device_spec);
293         void apply_eq(unsigned bus_index, std::vector<float> *samples_bus);
294         void update_meters(const std::vector<float> &samples);
295         void add_bus_to_master(unsigned bus_index, const std::vector<float> &samples_bus, std::vector<float> *samples_out);
296         void measure_bus_levels(unsigned bus_index, const std::vector<float> &left, const std::vector<float> &right);
297         void send_audio_level_callback();
298         std::vector<DeviceSpec> get_active_devices() const;
299
300         unsigned num_cards;
301
302         mutable std::timed_mutex audio_mutex;
303
304         ALSAPool alsa_pool;
305         AudioDevice video_cards[MAX_VIDEO_CARDS];  // Under audio_mutex.
306         AudioDevice alsa_inputs[MAX_ALSA_CARDS];  // Under audio_mutex.
307
308         std::atomic<float> locut_cutoff_hz{120};
309         StereoFilter locut[MAX_BUSES];  // Default cutoff 120 Hz, 24 dB/oct.
310         std::atomic<bool> locut_enabled[MAX_BUSES];
311         StereoFilter eq[MAX_BUSES][NUM_EQ_BANDS];  // The one for EQBand::MID isn't actually used (see comments in apply_eq()).
312
313         // First compressor; takes us up to about -12 dBFS.
314         mutable std::mutex compressor_mutex;
315         std::unique_ptr<StereoCompressor> level_compressor[MAX_BUSES];  // Under compressor_mutex. Used to set/override gain_staging_db if <level_compressor_enabled>.
316         float gain_staging_db[MAX_BUSES];  // Under compressor_mutex.
317         bool level_compressor_enabled[MAX_BUSES];  // Under compressor_mutex.
318
319         static constexpr float ref_level_dbfs = -14.0f;  // Chosen so that we end up around 0 LU in practice.
320         static constexpr float ref_level_lufs = -23.0f;  // 0 LU, more or less by definition.
321
322         StereoCompressor limiter;
323         std::atomic<float> limiter_threshold_dbfs{ref_level_dbfs + 4.0f};   // 4 dB.
324         std::atomic<bool> limiter_enabled{true};
325         std::unique_ptr<StereoCompressor> compressor[MAX_BUSES];
326         std::atomic<float> compressor_threshold_dbfs[MAX_BUSES];
327         std::atomic<bool> compressor_enabled[MAX_BUSES];
328
329         // Note: The values here are not in dB.
330         struct PeakHistory {
331                 float current_level = 0.0f;  // Peak of the last frame.
332                 float historic_peak = 0.0f;  // Highest peak since last reset; no falloff.
333                 float current_peak = 0.0f;  // Current peak of the peak meter.
334                 float last_peak = 0.0f;
335                 float age_seconds = 0.0f;   // Time since "last_peak" was set.
336         };
337         PeakHistory peak_history[MAX_BUSES][2];  // Separate for each channel. Under audio_mutex.
338
339         double final_makeup_gain = 1.0;  // Under compressor_mutex. Read/write by the user. Note: Not in dB, we want the numeric precision so that we can change it slowly.
340         bool final_makeup_gain_auto = true;  // Under compressor_mutex.
341
342         InputMapping input_mapping;  // Under audio_mutex.
343         std::atomic<float> fader_volume_db[MAX_BUSES] {{ 0.0f }};
344         float last_fader_volume_db[MAX_BUSES] { 0.0f };  // Under audio_mutex.
345         std::atomic<float> eq_level_db[MAX_BUSES][NUM_EQ_BANDS] {{{ 0.0f }}};
346         float last_eq_level_db[MAX_BUSES][NUM_EQ_BANDS] {{ 0.0f }};
347
348         audio_level_callback_t audio_level_callback = nullptr;
349         state_changed_callback_t state_changed_callback = nullptr;
350         mutable std::mutex audio_measure_mutex;
351         Ebu_r128_proc r128;  // Under audio_measure_mutex.
352         CorrelationMeasurer correlation;  // Under audio_measure_mutex.
353         Resampler peak_resampler;  // Under audio_measure_mutex.
354         std::atomic<float> peak{0.0f};
355 };
356
357 extern AudioMixer *global_audio_mixer;
358
359 #endif  // !defined(_AUDIO_MIXER_H)