X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=audio_mixer.cpp;h=6b7ffeb0d6d28fb1ffdbfa8308ab341970893b20;hb=54067dbc70999d936adf9d263b5ff2b1efb4dfd0;hp=7a36b0de255e53daeeb96e0fcc2de5521b411364;hpb=a803d2e93f69b6aa968e6b0f4a8498d0ef1b3b70;p=nageru

diff --git a/audio_mixer.cpp b/audio_mixer.cpp
index 7a36b0d..6b7ffeb 100644
--- a/audio_mixer.cpp
+++ b/audio_mixer.cpp
@@ -4,7 +4,11 @@
 #include <endian.h>
 #include <bmusb/bmusb.h>
 #include <stdio.h>
+#include <endian.h>
 #include <cmath>
+#ifdef __SSE__
+#include <immintrin.h>
+#endif
 
 #include "db.h"
 #include "flags.h"
@@ -12,36 +16,141 @@
 
 using namespace bmusb;
 using namespace std;
+using namespace std::placeholders;
 
 namespace {
 
-// TODO: If these prove to be a bottleneck, they can be SSSE3-optimized.
+// TODO: If these prove to be a bottleneck, they can be SSSE3-optimized
+// (usually including multiple channels at a time).
 
-void convert_fixed24_to_fp32(float *dst, size_t out_channels, const uint8_t *src, size_t in_channels, size_t num_samples)
+void convert_fixed16_to_fp32(float *dst, size_t out_channel, size_t out_num_channels,
+                             const uint8_t *src, size_t in_channel, size_t in_num_channels,
+                             size_t num_samples)
 {
-	assert(in_channels >= out_channels);
+	assert(in_channel < in_num_channels);
+	assert(out_channel < out_num_channels);
+	src += in_channel * 2;
+	dst += out_channel;
+
 	for (size_t i = 0; i < num_samples; ++i) {
-		for (size_t j = 0; j < out_channels; ++j) {
-			uint32_t s1 = *src++;
-			uint32_t s2 = *src++;
-			uint32_t s3 = *src++;
-			uint32_t s = s1 | (s1 << 8) | (s2 << 16) | (s3 << 24);
-			dst[i * out_channels + j] = int(s) * (1.0f / 2147483648.0f);
-		}
-		src += 3 * (in_channels - out_channels);
+		int16_t s = le16toh(*(int16_t *)src);
+		*dst = s * (1.0f / 32768.0f);
+
+		src += 2 * in_num_channels;
+		dst += out_num_channels;
 	}
 }
 
-void convert_fixed32_to_fp32(float *dst, size_t out_channels, const uint8_t *src, size_t in_channels, size_t num_samples)
+void convert_fixed24_to_fp32(float *dst, size_t out_channel, size_t out_num_channels,
+                             const uint8_t *src, size_t in_channel, size_t in_num_channels,
+                             size_t num_samples)
 {
-	assert(in_channels >= out_channels);
+	assert(in_channel < in_num_channels);
+	assert(out_channel < out_num_channels);
+	src += in_channel * 3;
+	dst += out_channel;
+
 	for (size_t i = 0; i < num_samples; ++i) {
-		for (size_t j = 0; j < out_channels; ++j) {
-			int32_t s = le32toh(*(int32_t *)src);
-			dst[i * out_channels + j] = s * (1.0f / 2147483648.0f);
-			src += 4;
-		}
-		src += 4 * (in_channels - out_channels);
+		uint32_t s1 = src[0];
+		uint32_t s2 = src[1];
+		uint32_t s3 = src[2];
+		uint32_t s = s1 | (s1 << 8) | (s2 << 16) | (s3 << 24);
+		*dst = int(s) * (1.0f / 2147483648.0f);
+
+		src += 3 * in_num_channels;
+		dst += out_num_channels;
+	}
+}
+
+void convert_fixed32_to_fp32(float *dst, size_t out_channel, size_t out_num_channels,
+                             const uint8_t *src, size_t in_channel, size_t in_num_channels,
+                             size_t num_samples)
+{
+	assert(in_channel < in_num_channels);
+	assert(out_channel < out_num_channels);
+	src += in_channel * 4;
+	dst += out_channel;
+
+	for (size_t i = 0; i < num_samples; ++i) {
+		int32_t s = le32toh(*(int32_t *)src);
+		*dst = s * (1.0f / 2147483648.0f);
+
+		src += 4 * in_num_channels;
+		dst += out_num_channels;
+	}
+}
+
+float find_peak_plain(const float *samples, size_t num_samples) __attribute__((unused));
+
+float find_peak_plain(const float *samples, size_t num_samples)
+{
+	float m = fabs(samples[0]);
+	for (size_t i = 1; i < num_samples; ++i) {
+		m = max(m, fabs(samples[i]));
+	}
+	return m;
+}
+
+#ifdef __SSE__
+static inline float horizontal_max(__m128 m)
+{
+	__m128 tmp = _mm_shuffle_ps(m, m, _MM_SHUFFLE(1, 0, 3, 2));
+	m = _mm_max_ps(m, tmp);
+	tmp = _mm_shuffle_ps(m, m, _MM_SHUFFLE(2, 3, 0, 1));
+	m = _mm_max_ps(m, tmp);
+	return _mm_cvtss_f32(m);
+}
+
+float find_peak(const float *samples, size_t num_samples)
+{
+	const __m128 abs_mask = _mm_castsi128_ps(_mm_set1_epi32(0x7fffffffu));
+	__m128 m = _mm_setzero_ps();
+	for (size_t i = 0; i < (num_samples & ~3); i += 4) {
+		__m128 x = _mm_loadu_ps(samples + i);
+		x = _mm_and_ps(x, abs_mask);
+		m = _mm_max_ps(m, x);
+	}
+	float result = horizontal_max(m);
+
+	for (size_t i = (num_samples & ~3); i < num_samples; ++i) {
+		result = max(result, fabs(samples[i]));
+	}
+
+#if 0
+	// Self-test. We should be bit-exact the same.
+	float reference_result = find_peak_plain(samples, num_samples);
+	if (result != reference_result) {
+		fprintf(stderr, "Error: Peak is %f [%f %f %f %f]; should be %f.\n",
+			result,
+			_mm_cvtss_f32(_mm_shuffle_ps(m, m, _MM_SHUFFLE(0, 0, 0, 0))),
+			_mm_cvtss_f32(_mm_shuffle_ps(m, m, _MM_SHUFFLE(1, 1, 1, 1))),
+			_mm_cvtss_f32(_mm_shuffle_ps(m, m, _MM_SHUFFLE(2, 2, 2, 2))),
+			_mm_cvtss_f32(_mm_shuffle_ps(m, m, _MM_SHUFFLE(3, 3, 3, 3))),
+			reference_result);
+		abort();
+	}
+#endif
+	return result;
+}
+#else
+float find_peak(const float *samples, size_t num_samples)
+{
+	return find_peak_plain(samples, num_samples);
+}
+#endif
+
+void deinterleave_samples(const vector<float> &in, vector<float> *out_l, vector<float> *out_r)
+{
+	size_t num_samples = in.size() / 2;
+	out_l->resize(num_samples);
+	out_r->resize(num_samples);
+
+	const float *inptr = in.data();
+	float *lptr = &(*out_l)[0];
+	float *rptr = &(*out_r)[0];
+	for (size_t i = 0; i < num_samples; ++i) {
+		*lptr++ = *inptr++;
+		*rptr++ = *inptr++;
 	}
 }
 
@@ -49,170 +158,312 @@ void convert_fixed32_to_fp32(float *dst, size_t out_channels, const uint8_t *src
 
 AudioMixer::AudioMixer(unsigned num_cards)
 	: num_cards(num_cards),
-	  level_compressor(OUTPUT_FREQUENCY),
 	  limiter(OUTPUT_FREQUENCY),
-	  compressor(OUTPUT_FREQUENCY)
+	  correlation(OUTPUT_FREQUENCY)
 {
-	locut.init(FILTER_HPF, 2);
-
-	set_locut_enabled(global_flags.locut_enabled);
-	set_gain_staging_db(global_flags.initial_gain_staging_db);
-	set_gain_staging_auto(global_flags.gain_staging_auto);
-	set_compressor_enabled(global_flags.compressor_enabled);
+	for (unsigned bus_index = 0; bus_index < MAX_BUSES; ++bus_index) {
+		locut[bus_index].init(FILTER_HPF, 2);
+		locut_enabled[bus_index] = global_flags.locut_enabled;
+		gain_staging_db[bus_index] = global_flags.initial_gain_staging_db;
+		compressor[bus_index].reset(new StereoCompressor(OUTPUT_FREQUENCY));
+		compressor_threshold_dbfs[bus_index] = ref_level_dbfs - 12.0f;  // -12 dB.
+		compressor_enabled[bus_index] = global_flags.compressor_enabled;
+		level_compressor[bus_index].reset(new StereoCompressor(OUTPUT_FREQUENCY));
+		level_compressor_enabled[bus_index] = global_flags.gain_staging_auto;
+	}
 	set_limiter_enabled(global_flags.limiter_enabled);
 	set_final_makeup_gain_auto(global_flags.final_makeup_gain_auto);
 
 	// Generate a very simple, default input mapping.
-	InputMapping::Input input;
+	InputMapping::Bus input;
 	input.name = "Main";
-	input.input_source_type = InputSourceType::CAPTURE_CARD;
-	input.input_source_index = 0;
+	input.device.type = InputSourceType::CAPTURE_CARD;
+	input.device.index = 0;
 	input.source_channel[0] = 0;
 	input.source_channel[1] = 1;
 
 	InputMapping new_input_mapping;
-	new_input_mapping.inputs.push_back(input);
+	new_input_mapping.buses.push_back(input);
 	set_input_mapping(new_input_mapping);
+
+	// Look for ALSA cards.
+	available_alsa_cards = ALSAInput::enumerate_devices();
+
+	r128.init(2, OUTPUT_FREQUENCY);
+	r128.integr_start();
+
+	// hlen=16 is pretty low quality, but we use quite a bit of CPU otherwise,
+	// and there's a limit to how important the peak meter is.
+	peak_resampler.setup(OUTPUT_FREQUENCY, OUTPUT_FREQUENCY * 4, /*num_channels=*/2, /*hlen=*/16, /*frel=*/1.0);
+}
+
+AudioMixer::~AudioMixer()
+{
+	for (unsigned card_index = 0; card_index < available_alsa_cards.size(); ++card_index) {
+		const AudioDevice &device = alsa_inputs[card_index];
+		if (device.alsa_device != nullptr) {
+			device.alsa_device->stop_capture_thread();
+		}
+	}
 }
 
-void AudioMixer::reset_card(unsigned card_index)
+
+void AudioMixer::reset_resampler(DeviceSpec device_spec)
 {
-	lock_guard<mutex> lock(audio_mutex);
-	reset_card_mutex_held(card_index);
+	lock_guard<timed_mutex> lock(audio_mutex);
+	reset_resampler_mutex_held(device_spec);
 }
 
-void AudioMixer::reset_card_mutex_held(unsigned card_index)
+void AudioMixer::reset_resampler_mutex_held(DeviceSpec device_spec)
 {
-	CaptureCard *card = &cards[card_index];
-	if (card->interesting_channels.empty()) {
-		card->resampling_queue.reset();
+	AudioDevice *device = find_audio_device(device_spec);
+
+	if (device->interesting_channels.empty()) {
+		device->resampling_queue.reset();
 	} else {
-		card->resampling_queue.reset(new ResamplingQueue(card_index, OUTPUT_FREQUENCY, OUTPUT_FREQUENCY, card->interesting_channels.size()));
+		// TODO: ResamplingQueue should probably take the full device spec.
+		// (It's only used for console output, though.)
+		device->resampling_queue.reset(new ResamplingQueue(device_spec.index, device->capture_frequency, OUTPUT_FREQUENCY, device->interesting_channels.size()));
 	}
-	card->next_local_pts = 0;
+	device->next_local_pts = 0;
 }
 
-void AudioMixer::add_audio(unsigned card_index, const uint8_t *data, unsigned num_samples, AudioFormat audio_format, int64_t frame_length)
+void AudioMixer::reset_alsa_mutex_held(DeviceSpec device_spec)
 {
-	lock_guard<mutex> lock(audio_mutex);
-	CaptureCard *card = &cards[card_index];
+	assert(device_spec.type == InputSourceType::ALSA_INPUT);
+	unsigned card_index = device_spec.index;
+	AudioDevice *device = find_audio_device(device_spec);
 
-	if (card->resampling_queue == nullptr) {
-		// No inputs use this card; throw it away.
-		return;
+	if (device->alsa_device != nullptr) {
+		device->alsa_device->stop_capture_thread();
+	}
+	if (device->interesting_channels.empty()) {
+		device->alsa_device.reset();
+	} else {
+		const ALSAInput::Device &alsa_dev = available_alsa_cards[card_index];
+		device->alsa_device.reset(new ALSAInput(alsa_dev.address.c_str(), OUTPUT_FREQUENCY, alsa_dev.num_channels, bind(&AudioMixer::add_audio, this, device_spec, _1, _2, _3, _4)));
+		device->capture_frequency = device->alsa_device->get_sample_rate();
+		device->alsa_device->start_capture_thread();
+	}
+}
+
+bool AudioMixer::add_audio(DeviceSpec device_spec, const uint8_t *data, unsigned num_samples, AudioFormat audio_format, int64_t frame_length)
+{
+	AudioDevice *device = find_audio_device(device_spec);
+
+	unique_lock<timed_mutex> lock(audio_mutex, defer_lock);
+	if (!lock.try_lock_for(chrono::milliseconds(10))) {
+		return false;
+	}
+	if (device->resampling_queue == nullptr) {
+		// No buses use this device; throw it away.
+		return true;
 	}
 
-	unsigned num_channels = card->interesting_channels.size();
+	unsigned num_channels = device->interesting_channels.size();
 	assert(num_channels > 0);
 
-	// Convert the audio to stereo fp32.
-	// FIXME: Pick out the right channels; this takes the first ones.
-	vector<float> audio;
-	audio.resize(num_samples * num_channels);
-	switch (audio_format.bits_per_sample) {
-	case 0:
-		assert(num_samples == 0);
-		break;
-	case 24:
-		convert_fixed24_to_fp32(&audio[0], num_channels, data, audio_format.num_channels, num_samples);
-		break;
-	case 32:
-		convert_fixed32_to_fp32(&audio[0], num_channels, data, audio_format.num_channels, num_samples);
-		break;
-	default:
-		fprintf(stderr, "Cannot handle audio with %u bits per sample\n", audio_format.bits_per_sample);
-		assert(false);
+	// Convert the audio to fp32.
+	unique_ptr<float[]> audio(new float[num_samples * num_channels]);
+	unsigned channel_index = 0;
+	for (auto channel_it = device->interesting_channels.cbegin(); channel_it != device->interesting_channels.end(); ++channel_it, ++channel_index) {
+		switch (audio_format.bits_per_sample) {
+		case 0:
+			assert(num_samples == 0);
+			break;
+		case 16:
+			convert_fixed16_to_fp32(audio.get(), channel_index, num_channels, data, *channel_it, audio_format.num_channels, num_samples);
+			break;
+		case 24:
+			convert_fixed24_to_fp32(audio.get(), channel_index, num_channels, data, *channel_it, audio_format.num_channels, num_samples);
+			break;
+		case 32:
+			convert_fixed32_to_fp32(audio.get(), channel_index, num_channels, data, *channel_it, audio_format.num_channels, num_samples);
+			break;
+		default:
+			fprintf(stderr, "Cannot handle audio with %u bits per sample\n", audio_format.bits_per_sample);
+			assert(false);
+		}
 	}
 
 	// Now add it.
-	int64_t local_pts = card->next_local_pts;
-	card->resampling_queue->add_input_samples(local_pts / double(TIMEBASE), audio.data(), num_samples);
-	card->next_local_pts = local_pts + frame_length;
+	int64_t local_pts = device->next_local_pts;
+	device->resampling_queue->add_input_samples(local_pts / double(TIMEBASE), audio.get(), num_samples);
+	device->next_local_pts = local_pts + frame_length;
+	return true;
 }
 
-void AudioMixer::add_silence(unsigned card_index, unsigned samples_per_frame, unsigned num_frames, int64_t frame_length)
+bool AudioMixer::add_silence(DeviceSpec device_spec, unsigned samples_per_frame, unsigned num_frames, int64_t frame_length)
 {
-	CaptureCard *card = &cards[card_index];
-	lock_guard<mutex> lock(audio_mutex);
+	AudioDevice *device = find_audio_device(device_spec);
 
-	if (card->resampling_queue == nullptr) {
-		// No inputs use this card; throw it away.
-		return;
+	unique_lock<timed_mutex> lock(audio_mutex, defer_lock);
+	if (!lock.try_lock_for(chrono::milliseconds(10))) {
+		return false;
+	}
+	if (device->resampling_queue == nullptr) {
+		// No buses use this device; throw it away.
+		return true;
 	}
 
-	unsigned num_channels = card->interesting_channels.size();
+	unsigned num_channels = device->interesting_channels.size();
 	assert(num_channels > 0);
 
 	vector<float> silence(samples_per_frame * num_channels, 0.0f);
 	for (unsigned i = 0; i < num_frames; ++i) {
-		card->resampling_queue->add_input_samples(card->next_local_pts / double(TIMEBASE), silence.data(), samples_per_frame);
+		device->resampling_queue->add_input_samples(device->next_local_pts / double(TIMEBASE), silence.data(), samples_per_frame);
 		// Note that if the format changed in the meantime, we have
 		// no way of detecting that; we just have to assume the frame length
 		// is always the same.
-		card->next_local_pts += frame_length;
+		device->next_local_pts += frame_length;
 	}
+	return true;
 }
 
-void AudioMixer::find_sample_src_from_capture_card(const vector<float> *samples_card, unsigned card_index, int source_channel, const float **srcptr, unsigned *stride)
+AudioMixer::AudioDevice *AudioMixer::find_audio_device(DeviceSpec device)
+{
+	switch (device.type) {
+	case InputSourceType::CAPTURE_CARD:
+		return &video_cards[device.index];
+	case InputSourceType::ALSA_INPUT:
+		return &alsa_inputs[device.index];
+	case InputSourceType::SILENCE:
+	default:
+		assert(false);
+	}
+	return nullptr;
+}
+
+// Get a pointer to the given channel from the given device.
+// The channel must be picked out earlier and resampled.
+void AudioMixer::find_sample_src_from_device(const map<DeviceSpec, vector<float>> &samples_card, DeviceSpec device_spec, int source_channel, const float **srcptr, unsigned *stride)
 {
 	static float zero = 0.0f;
-	if (source_channel == -1) {
+	if (source_channel == -1 || device_spec.type == InputSourceType::SILENCE) {
 		*srcptr = &zero;
 		*stride = 0;
 		return;
 	}
-	// FIXME: map back through the interesting_channels squeeze map instead of using source_channel
-	// directly, which will be wrong (and might even overrun).
-	*srcptr = &samples_card[card_index][source_channel];
-	*stride = cards[card_index].interesting_channels.size();
+	AudioDevice *device = find_audio_device(device_spec);
+	assert(device->interesting_channels.count(source_channel) != 0);
+	unsigned channel_index = 0;
+	for (int channel : device->interesting_channels) {
+		if (channel == source_channel) break;
+		++channel_index;
+	}
+	assert(channel_index < device->interesting_channels.size());
+	const auto it = samples_card.find(device_spec);
+	assert(it != samples_card.end());
+	*srcptr = &(it->second)[channel_index];
+	*stride = device->interesting_channels.size();
+}
+
+// TODO: Can be SSSE3-optimized if need be.
+void AudioMixer::fill_audio_bus(const map<DeviceSpec, vector<float>> &samples_card, const InputMapping::Bus &bus, unsigned num_samples, float *output)
+{
+	if (bus.device.type == InputSourceType::SILENCE) {
+		memset(output, 0, num_samples * sizeof(*output));
+	} else {
+		assert(bus.device.type == InputSourceType::CAPTURE_CARD ||
+		       bus.device.type == InputSourceType::ALSA_INPUT);
+		const float *lsrc, *rsrc;
+		unsigned lstride, rstride;
+		float *dptr = output;
+		find_sample_src_from_device(samples_card, bus.device, bus.source_channel[0], &lsrc, &lstride);
+		find_sample_src_from_device(samples_card, bus.device, bus.source_channel[1], &rsrc, &rstride);
+		for (unsigned i = 0; i < num_samples; ++i) {
+			*dptr++ = *lsrc;
+			*dptr++ = *rsrc;
+			lsrc += lstride;
+			rsrc += rstride;
+		}
+	}
 }
 
 vector<float> AudioMixer::get_output(double pts, unsigned num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy)
 {
-	vector<float> samples_card[MAX_CARDS];
+	map<DeviceSpec, vector<float>> samples_card;
 	vector<float> samples_bus;
 
-	lock_guard<mutex> lock(audio_mutex);
+	lock_guard<timed_mutex> lock(audio_mutex);
 
 	// Pick out all the interesting channels from all the cards.
-	for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
-		CaptureCard *card = &cards[card_index];
-		if (!card->interesting_channels.empty()) {
-			samples_card[card_index].resize(num_samples * card->interesting_channels.size());
-			card->resampling_queue->get_output_samples(
+	// TODO: If the card has been hotswapped, the number of channels
+	// might have changed; if so, we need to do some sort of remapping
+	// to silence.
+	for (const auto &spec_and_info : get_devices_mutex_held()) {
+		const DeviceSpec &device_spec = spec_and_info.first;
+		AudioDevice *device = find_audio_device(device_spec);
+		if (!device->interesting_channels.empty()) {
+			samples_card[device_spec].resize(num_samples * device->interesting_channels.size());
+			device->resampling_queue->get_output_samples(
 				pts,
-				&samples_card[card_index][0],
+				&samples_card[device_spec][0],
 				num_samples,
 				rate_adjustment_policy);
 		}
 	}
 
-	// TODO: Move lo-cut etc. into each bus.
-	vector<float> samples_out;
+	vector<float> samples_out, left, right;
 	samples_out.resize(num_samples * 2);
 	samples_bus.resize(num_samples * 2);
-	for (unsigned input_index = 0; input_index < input_mapping.inputs.size(); ++input_index) {
-		const InputMapping::Input &input = input_mapping.inputs[input_index];
-		if (input.input_source_type == InputSourceType::SILENCE) {
-			memset(&samples_bus[0], 0, samples_bus.size() * sizeof(samples_bus[0]));
-		} else {
-			// TODO: Move this into its own function. Can be SSSE3-optimized if need be.
-			assert(input.input_source_type == InputSourceType::CAPTURE_CARD);
-			const float *lsrc, *rsrc;
-			unsigned lstride, rstride;
-			float *dptr = &samples_bus[0];
-			find_sample_src_from_capture_card(samples_card, input.input_source_index, input.source_channel[0], &lsrc, &lstride);
-			find_sample_src_from_capture_card(samples_card, input.input_source_index, input.source_channel[1], &rsrc, &rstride);
-			for (unsigned i = 0; i < num_samples; ++i) {
-				*dptr++ = *lsrc;
-				*dptr++ = *rsrc;
-				lsrc += lstride;
-				rsrc += rstride;
+	for (unsigned bus_index = 0; bus_index < input_mapping.buses.size(); ++bus_index) {
+		fill_audio_bus(samples_card, input_mapping.buses[bus_index], num_samples, &samples_bus[0]);
+
+		// Cut away everything under 120 Hz (or whatever the cutoff is);
+		// we don't need it for voice, and it will reduce headroom
+		// and confuse the compressor. (In particular, any hums at 50 or 60 Hz
+		// should be dampened.)
+		if (locut_enabled[bus_index]) {
+			locut[bus_index].render(samples_bus.data(), samples_bus.size() / 2, locut_cutoff_hz * 2.0 * M_PI / OUTPUT_FREQUENCY, 0.5f);
+		}
+
+		{
+			lock_guard<mutex> lock(compressor_mutex);
+
+			// Apply a level compressor to get the general level right.
+			// Basically, if it's over about -40 dBFS, we squeeze it down to that level
+			// (or more precisely, near it, since we don't use infinite ratio),
+			// then apply a makeup gain to get it to -14 dBFS. -14 dBFS is, of course,
+			// entirely arbitrary, but from practical tests with speech, it seems to
+			// put ut around -23 LUFS, so it's a reasonable starting point for later use.
+			if (level_compressor_enabled[bus_index]) {
+				float threshold = 0.01f;   // -40 dBFS.
+				float ratio = 20.0f;
+				float attack_time = 0.5f;
+				float release_time = 20.0f;
+				float makeup_gain = from_db(ref_level_dbfs - (-40.0f));  // +26 dB.
+				level_compressor[bus_index]->process(samples_bus.data(), samples_bus.size() / 2, threshold, ratio, attack_time, release_time, makeup_gain);
+				gain_staging_db[bus_index] = to_db(level_compressor[bus_index]->get_attenuation() * makeup_gain);
+			} else {
+				// Just apply the gain we already had.
+				float g = from_db(gain_staging_db[bus_index]);
+				for (size_t i = 0; i < samples_bus.size(); ++i) {
+					samples_bus[i] *= g;
+				}
+			}
+
+#if 0
+			printf("level=%f (%+5.2f dBFS) attenuation=%f (%+5.2f dB) end_result=%+5.2f dB\n",
+				level_compressor.get_level(), to_db(level_compressor.get_level()),
+				level_compressor.get_attenuation(), to_db(level_compressor.get_attenuation()),
+				to_db(level_compressor.get_level() * level_compressor.get_attenuation() * makeup_gain));
+#endif
+
+			// The real compressor.
+			if (compressor_enabled[bus_index]) {
+				float threshold = from_db(compressor_threshold_dbfs[bus_index]);
+				float ratio = 20.0f;
+				float attack_time = 0.005f;
+				float release_time = 0.040f;
+				float makeup_gain = 2.0f;  // +6 dB.
+				compressor[bus_index]->process(samples_bus.data(), samples_bus.size() / 2, threshold, ratio, attack_time, release_time, makeup_gain);
+		//		compressor_att = compressor.get_attenuation();
 			}
 		}
 
-		float volume = from_db(fader_volume_db[input_index]);
-		if (input_index == 0) {
+		float volume = from_db(fader_volume_db[bus_index]);
+		if (bus_index == 0) {
 			for (unsigned i = 0; i < num_samples * 2; ++i) {
 				samples_out[i] = samples_bus[i] * volume;
 			}
@@ -221,63 +472,14 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
 				samples_out[i] += samples_bus[i] * volume;
 			}
 		}
-	}
 
-	// Cut away everything under 120 Hz (or whatever the cutoff is);
-	// we don't need it for voice, and it will reduce headroom
-	// and confuse the compressor. (In particular, any hums at 50 or 60 Hz
-	// should be dampened.)
-	if (locut_enabled) {
-		locut.render(samples_out.data(), samples_out.size() / 2, locut_cutoff_hz * 2.0 * M_PI / OUTPUT_FREQUENCY, 0.5f);
+		deinterleave_samples(samples_bus, &left, &right);
+		measure_bus_levels(bus_index, left, right, volume);
 	}
 
 	{
 		lock_guard<mutex> lock(compressor_mutex);
 
-		// Apply a level compressor to get the general level right.
-		// Basically, if it's over about -40 dBFS, we squeeze it down to that level
-		// (or more precisely, near it, since we don't use infinite ratio),
-		// then apply a makeup gain to get it to -14 dBFS. -14 dBFS is, of course,
-		// entirely arbitrary, but from practical tests with speech, it seems to
-		// put ut around -23 LUFS, so it's a reasonable starting point for later use.
-		{
-			if (level_compressor_enabled) {
-				float threshold = 0.01f;   // -40 dBFS.
-				float ratio = 20.0f;
-				float attack_time = 0.5f;
-				float release_time = 20.0f;
-				float makeup_gain = from_db(ref_level_dbfs - (-40.0f));  // +26 dB.
-				level_compressor.process(samples_out.data(), samples_out.size() / 2, threshold, ratio, attack_time, release_time, makeup_gain);
-				gain_staging_db = to_db(level_compressor.get_attenuation() * makeup_gain);
-			} else {
-				// Just apply the gain we already had.
-				float g = from_db(gain_staging_db);
-				for (size_t i = 0; i < samples_out.size(); ++i) {
-					samples_out[i] *= g;
-				}
-			}
-		}
-
-	#if 0
-		printf("level=%f (%+5.2f dBFS) attenuation=%f (%+5.2f dB) end_result=%+5.2f dB\n",
-			level_compressor.get_level(), to_db(level_compressor.get_level()),
-			level_compressor.get_attenuation(), to_db(level_compressor.get_attenuation()),
-			to_db(level_compressor.get_level() * level_compressor.get_attenuation() * makeup_gain));
-	#endif
-
-	//	float limiter_att, compressor_att;
-
-		// The real compressor.
-		if (compressor_enabled) {
-			float threshold = from_db(compressor_threshold_dbfs);
-			float ratio = 20.0f;
-			float attack_time = 0.005f;
-			float release_time = 0.040f;
-			float makeup_gain = 2.0f;  // +6 dB.
-			compressor.process(samples_out.data(), samples_out.size() / 2, threshold, ratio, attack_time, release_time, makeup_gain);
-	//		compressor_att = compressor.get_attenuation();
-		}
-
 		// Finally a limiter at -4 dB (so, -10 dBFS) to take out the worst peaks only.
 		// Note that since ratio is not infinite, we could go slightly higher than this.
 		if (limiter_enabled) {
@@ -293,7 +495,8 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
 	//	printf("limiter=%+5.1f  compressor=%+5.1f\n", to_db(limiter_att), to_db(compressor_att));
 	}
 
-	// At this point, we are most likely close to +0 LU, but all of our
+	// At this point, we are most likely close to +0 LU (at least if the
+	// faders sum to 0 dB and the compressors are on), but all of our
 	// measurements have been on raw sample values, not R128 values.
 	// So we have a final makeup gain to get us to +0 LU; the gain
 	// adjustments required should be relatively small, and also, the
@@ -305,7 +508,7 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
 	// Note that there's a feedback loop here, so we choose a very slow filter
 	// (half-time of 30 seconds).
 	double target_loudness_factor, alpha;
-	double loudness_lu = loudness_lufs - ref_level_lufs;
+	double loudness_lu = r128.loudness_M() - ref_level_lufs;
 	double current_makeup_lu = to_db(final_makeup_gain);
 	target_loudness_factor = final_makeup_gain * from_db(-loudness_lu);
 
@@ -333,48 +536,186 @@ vector<float> AudioMixer::get_output(double pts, unsigned num_samples, Resamplin
 		final_makeup_gain = m;
 	}
 
+	update_meters(samples_out);
+
 	return samples_out;
 }
 
-vector<string> AudioMixer::get_names() const
+void AudioMixer::measure_bus_levels(unsigned bus_index, const vector<float> &left, const vector<float> &right, float volume)
+{
+	assert(left.size() == right.size());
+	const float peak_levels[2] = {
+		find_peak(left.data(), left.size()) * volume,
+		find_peak(right.data(), right.size()) * volume
+	};
+	for (unsigned channel = 0; channel < 2; ++channel) {
+		// Compute the current value, including hold and falloff.
+		// The constants are borrowed from zita-mu1 by Fons Adriaensen.
+		static constexpr float hold_sec = 0.5f;
+		static constexpr float falloff_db_sec = 15.0f;  // dB/sec falloff after hold.
+		float current_peak;
+		PeakHistory &history = peak_history[bus_index][channel];
+		if (history.age_seconds < hold_sec) {
+			current_peak = history.last_peak;
+		} else {
+			current_peak = history.last_peak * from_db(-falloff_db_sec * (history.age_seconds - hold_sec));
+		}
+
+		// See if we have a new peak to replace the old (possibly falling) one.
+		if (peak_levels[channel] > current_peak) {
+			history.last_peak = peak_levels[channel];
+			history.age_seconds = 0.0f;  // Not 100% correct, but more than good enough given our frame sizes.
+			current_peak = peak_levels[channel];
+		} else {
+			history.age_seconds += float(left.size()) / OUTPUT_FREQUENCY;
+		}
+		history.current_level = peak_levels[channel];
+		history.current_peak = current_peak;
+	}
+}
+
+void AudioMixer::update_meters(const vector<float> &samples)
+{
+	// Upsample 4x to find interpolated peak.
+	peak_resampler.inp_data = const_cast<float *>(samples.data());
+	peak_resampler.inp_count = samples.size() / 2;
+
+	vector<float> interpolated_samples;
+	interpolated_samples.resize(samples.size());
+	{
+		lock_guard<mutex> lock(audio_measure_mutex);
+
+		while (peak_resampler.inp_count > 0) {  // About four iterations.
+			peak_resampler.out_data = &interpolated_samples[0];
+			peak_resampler.out_count = interpolated_samples.size() / 2;
+			peak_resampler.process();
+			size_t out_stereo_samples = interpolated_samples.size() / 2 - peak_resampler.out_count;
+			peak = max<float>(peak, find_peak(interpolated_samples.data(), out_stereo_samples * 2));
+			peak_resampler.out_data = nullptr;
+		}
+	}
+
+	// Find R128 levels and L/R correlation.
+	vector<float> left, right;
+	deinterleave_samples(samples, &left, &right);
+	float *ptrs[] = { left.data(), right.data() };
+	{
+		lock_guard<mutex> lock(audio_measure_mutex);
+		r128.process(left.size(), ptrs);
+		correlation.process_samples(samples);
+	}
+
+	send_audio_level_callback();
+}
+
+void AudioMixer::reset_meters()
+{
+	lock_guard<mutex> lock(audio_measure_mutex);
+	peak_resampler.reset();
+	peak = 0.0f;
+	r128.reset();
+	r128.integr_start();
+	correlation.reset();
+}
+
+void AudioMixer::send_audio_level_callback()
+{
+	if (audio_level_callback == nullptr) {
+		return;
+	}
+
+	lock_guard<mutex> lock(audio_measure_mutex);
+	double loudness_s = r128.loudness_S();
+	double loudness_i = r128.integrated();
+	double loudness_range_low = r128.range_min();
+	double loudness_range_high = r128.range_max();
+
+	vector<BusLevel> bus_levels;
+	bus_levels.resize(input_mapping.buses.size());
+	{
+		lock_guard<mutex> lock(compressor_mutex);
+		for (unsigned bus_index = 0; bus_index < bus_levels.size(); ++bus_index) {
+			bus_levels[bus_index].current_level_dbfs[0] = to_db(peak_history[bus_index][0].current_level);
+			bus_levels[bus_index].current_level_dbfs[1] = to_db(peak_history[bus_index][1].current_level);
+			bus_levels[bus_index].peak_level_dbfs[0] = to_db(peak_history[bus_index][0].current_peak);
+			bus_levels[bus_index].peak_level_dbfs[1] = to_db(peak_history[bus_index][1].current_peak);
+			bus_levels[bus_index].gain_staging_db = gain_staging_db[bus_index];
+			if (compressor_enabled[bus_index]) {
+				bus_levels[bus_index].compressor_attenuation_db = -to_db(compressor[bus_index]->get_attenuation());
+			} else {
+				bus_levels[bus_index].compressor_attenuation_db = 0.0;
+			}
+		}
+	}
+
+	audio_level_callback(loudness_s, to_db(peak), bus_levels,
+		loudness_i, loudness_range_low, loudness_range_high,
+		to_db(final_makeup_gain),
+		correlation.get_correlation());
+}
+
+map<DeviceSpec, DeviceInfo> AudioMixer::get_devices() const
+{
+	lock_guard<timed_mutex> lock(audio_mutex);
+	return get_devices_mutex_held();
+}
+
+map<DeviceSpec, DeviceInfo> AudioMixer::get_devices_mutex_held() const
 {
-	lock_guard<mutex> lock(audio_mutex);
-	vector<string> names;
+	map<DeviceSpec, DeviceInfo> devices;
 	for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
-		const CaptureCard *card = &cards[card_index];
-		names.push_back(card->name);
+		const DeviceSpec spec{ InputSourceType::CAPTURE_CARD, card_index };
+		const AudioDevice *device = &video_cards[card_index];
+		DeviceInfo info;
+		info.name = device->name;
+		info.num_channels = 8;  // FIXME: This is wrong for fake cards.
+		devices.insert(make_pair(spec, info));
 	}
-	return names;
+	for (unsigned card_index = 0; card_index < available_alsa_cards.size(); ++card_index) {
+		const DeviceSpec spec{ InputSourceType::ALSA_INPUT, card_index };
+		const ALSAInput::Device &device = available_alsa_cards[card_index];
+		DeviceInfo info;
+		info.name = device.name + " (" + device.info + ")";
+		info.num_channels = device.num_channels;
+		devices.insert(make_pair(spec, info));
+	}
+	return devices;
 }
 
-void AudioMixer::set_name(unsigned card_index, const string &name)
+void AudioMixer::set_name(DeviceSpec device_spec, const string &name)
 {
-	lock_guard<mutex> lock(audio_mutex);
-	CaptureCard *card = &cards[card_index];
-	card->name = name;
+	AudioDevice *device = find_audio_device(device_spec);
+
+	lock_guard<timed_mutex> lock(audio_mutex);
+	device->name = name;
 }
 
 void AudioMixer::set_input_mapping(const InputMapping &new_input_mapping)
 {
-	lock_guard<mutex> lock(audio_mutex);
+	lock_guard<timed_mutex> lock(audio_mutex);
 
-	map<unsigned, set<unsigned>> interesting_channels;
-	for (const InputMapping::Input &input : new_input_mapping.inputs) {
-		if (input.input_source_type == InputSourceType::CAPTURE_CARD) {
+	map<DeviceSpec, set<unsigned>> interesting_channels;
+	for (const InputMapping::Bus &bus : new_input_mapping.buses) {
+		if (bus.device.type == InputSourceType::CAPTURE_CARD ||
+		    bus.device.type == InputSourceType::ALSA_INPUT) {
 			for (unsigned channel = 0; channel < 2; ++channel) {
-				if (input.source_channel[channel] != -1) {
-					interesting_channels[input.input_source_index].insert(input.source_channel[channel]);
+				if (bus.source_channel[channel] != -1) {
+					interesting_channels[bus.device].insert(bus.source_channel[channel]);
 				}
 			}
 		}
 	}
 
 	// Reset resamplers for all cards that don't have the exact same state as before.
-	for (unsigned card_index = 0; card_index < num_cards; ++card_index) {
-		CaptureCard *card = &cards[card_index];
-		if (card->interesting_channels != interesting_channels[card_index]) {
-			card->interesting_channels = interesting_channels[card_index];
-			reset_card_mutex_held(card_index);
+	for (const auto &spec_and_info : get_devices_mutex_held()) {
+		const DeviceSpec &device_spec = spec_and_info.first;
+		AudioDevice *device = find_audio_device(device_spec);
+		if (device->interesting_channels != interesting_channels[device_spec]) {
+			device->interesting_channels = interesting_channels[device_spec];
+			if (device_spec.type == InputSourceType::ALSA_INPUT) {
+				reset_alsa_mutex_held(device_spec);
+			}
+			reset_resampler_mutex_held(device_spec);
 		}
 	}
 
@@ -383,6 +724,6 @@ void AudioMixer::set_input_mapping(const InputMapping &new_input_mapping)
 
 InputMapping AudioMixer::get_input_mapping() const
 {
-	lock_guard<mutex> lock(audio_mutex);
+	lock_guard<timed_mutex> lock(audio_mutex);
 	return input_mapping;
 }