git.sesse.net Git - nageru/blob - nageru/resampling_queue.cpp

   1 // Parts of the code are adapted from Adriaensen's project Zita-ajbridge
   2 // (as of November 2015), although it has been heavily reworked for this use
   3 // case. Original copyright follows:
   4 //
   5 //  Copyright (C) 2012-2015 Fons Adriaensen <fons@linuxaudio.org>
   6 //
   7 //  This program is free software; you can redistribute it and/or modify
   8 //  it under the terms of the GNU General Public License as published by
   9 //  the Free Software Foundation; either version 3 of the License, or
  10 //  (at your option) any later version.
  11 //
  12 //  This program is distributed in the hope that it will be useful,
  13 //  but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 //  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 //  GNU General Public License for more details.
  16 //
  17 //  You should have received a copy of the GNU General Public License
  18 //  along with this program.  If not, see <http://www.gnu.org/licenses/>.
  19
  20 #include "resampling_queue.h"
  21
  22 #include <assert.h>
  23 #include <chrono>
  24 #include <math.h>
  25 #include <stdio.h>
  26 #include <stdlib.h>
  27 #include <string.h>
  28 #include <string>
  29 #include <sys/types.h>
  30 #include <zita-resampler/vresampler.h>
  31 #include <algorithm>
  32
  33 #include "shared/shared_defs.h"
  34
  35 using namespace std;
  36 using namespace std::chrono;
  37
  38 ResamplingQueue::ResamplingQueue(const std::string &debug_description, unsigned freq_in, unsigned freq_out, unsigned num_channels, double expected_delay_seconds)
  39         : debug_description(debug_description), freq_in(freq_in), freq_out(freq_out), num_channels(num_channels),
  40           current_estimated_freq_in(freq_in),
  41           ratio(double(freq_out) / double(freq_in)), expected_delay(expected_delay_seconds * OUTPUT_FREQUENCY)
  42 {
  43         vresampler.setup(ratio, num_channels, /*hlen=*/32);
  44
  45         // Prime the resampler so there's no more delay.
  46         vresampler.inp_count = vresampler.inpsize() / 2 - 1;
  47         vresampler.out_count = 1048576;
  48         vresampler.process ();
  49 }
  50
  51 void ResamplingQueue::add_input_samples(steady_clock::time_point ts, const float *samples, ssize_t num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy)
  52 {
  53         if (num_samples == 0) {
  54                 return;
  55         }
  56
  57         assert(duration<double>(ts.time_since_epoch()).count() >= 0.0);
  58
  59         bool good_sample = (rate_adjustment_policy == ADJUST_RATE);
  60         if (good_sample && a1.good_sample) {
  61                 a0 = a1;
  62         }
  63         a1.ts = ts;
  64         a1.input_samples_received += num_samples;
  65         a1.good_sample = good_sample;
  66         if (a0.good_sample && a1.good_sample) {
  67                 current_estimated_freq_in = (a1.input_samples_received - a0.input_samples_received) / duration<double>(a1.ts - a0.ts).count();
  68                 if (!(current_estimated_freq_in >= 0.0)) {
  69                         fprintf(stderr, "%s: PANIC: Input audio clock going backwards, ignoring.\n",
  70                                 debug_description.c_str());
  71                         current_estimated_freq_in = freq_in;
  72                 }
  73
  74                 // Bound the frequency, so that a single wild result won't throw the filter off guard.
  75                 current_estimated_freq_in = min(current_estimated_freq_in, 1.2 * freq_in);
  76                 current_estimated_freq_in = max(current_estimated_freq_in, 0.8 * freq_in);
  77         }
  78
  79         buffer.insert(buffer.end(), samples, samples + num_samples * num_channels);
  80 }
  81
  82 bool ResamplingQueue::get_output_samples(steady_clock::time_point ts, float *samples, ssize_t num_samples, ResamplingQueue::RateAdjustmentPolicy rate_adjustment_policy)
  83 {
  84         assert(num_samples > 0);
  85         if (a1.input_samples_received == 0) {
  86                 // No data yet, just return zeros.
  87                 memset(samples, 0, num_samples * num_channels * sizeof(float));
  88                 return true;
  89         }
  90
  91         // This can happen when we get dropped frames on the master card.
  92         if (duration<double>(ts.time_since_epoch()).count() <= 0.0) {
  93                 rate_adjustment_policy = DO_NOT_ADJUST_RATE;
  94         }
  95
  96         if (rate_adjustment_policy == ADJUST_RATE && (a0.good_sample || a1.good_sample)) {
  97                 // Estimate the current number of input samples produced at
  98                 // this instant in time, by extrapolating from the last known
  99                 // good point. Note that we could be extrapolating backward or
 100                 // forward, depending on the timing of the calls.
 101                 const InputPoint &base_point = a1.good_sample ? a1 : a0;
 102                 assert(duration<double>(base_point.ts.time_since_epoch()).count() >= 0.0);
 103
 104                 // NOTE: Due to extrapolation, input_samples_received can
 105                 // actually go negative here the few first calls (ie., we asked
 106                 // about a timestamp where we hadn't actually started producing
 107                 // samples yet), but that is harmless.
 108                 const double input_samples_received = base_point.input_samples_received +
 109                         current_estimated_freq_in * duration<double>(ts - base_point.ts).count();
 110
 111                 // Estimate the number of input samples _consumed_ after we've run the resampler.
 112                 const double input_samples_consumed = total_consumed_samples +
 113                         num_samples / (ratio * rcorr);
 114
 115                 double actual_delay = input_samples_received - input_samples_consumed;
 116                 actual_delay += vresampler.inpdist();    // Delay in the resampler itself.
 117                 double err = actual_delay - expected_delay;
 118                 if (first_output) {
 119                         // Before the very first block, insert artificial delay based on our initial estimate,
 120                         // so that we don't need a long period to stabilize at the beginning.
 121                         if (err < 0.0) {
 122                                 int delay_samples_to_add = lrintf(-err);
 123                                 for (ssize_t i = 0; i < delay_samples_to_add * int(num_channels); ++i) {
 124                                         buffer.push_front(0.0f);
 125                                 }
 126                                 total_consumed_samples -= delay_samples_to_add;  // Equivalent to increasing input_samples_received on a0 and a1.
 127                                 err += delay_samples_to_add;
 128                         } else if (err > 0.0) {
 129                                 int delay_samples_to_remove = min<int>(lrintf(err), buffer.size() / num_channels);
 130                                 buffer.erase(buffer.begin(), buffer.begin() + delay_samples_to_remove * num_channels);
 131                                 total_consumed_samples += delay_samples_to_remove;
 132                                 err -= delay_samples_to_remove;
 133                         }
 134                 }
 135                 first_output = false;
 136
 137                 // Compute loop filter coefficients for the two filters. We need to compute them
 138                 // every time, since they depend on the number of samples the user asked for.
 139                 //
 140                 // The loop bandwidth is at 0.02 Hz; our jitter is pretty large
 141                 // since none of the threads involved run at real-time priority.
 142                 // However, the first four seconds, we use a larger loop bandwidth (2 Hz),
 143                 // because there's a lot going on during startup, and thus the
 144                 // initial estimate might be tainted by jitter during that phase,
 145                 // and we want to converge faster.
 146                 //
 147                 // NOTE: The above logic might only hold during Nageru startup
 148                 // (we start ResamplingQueues also when we e.g. switch sound sources),
 149                 // but in general, a little bit of increased timing jitter is acceptable
 150                 // right after a setup change like this.
 151                 double loop_bandwidth_hz = (total_consumed_samples < 4 * int(freq_in)) ? 0.2 : 0.02;
 152
 153                 // Set filters. The first filter much wider than the first one (20x as wide).
 154                 double w = (2.0 * M_PI) * loop_bandwidth_hz * num_samples / freq_out;
 155                 double w0 = 1.0 - exp(-20.0 * w);
 156                 double w1 = w * 1.5 / num_samples / ratio;
 157                 double w2 = w / 1.5;
 158
 159                 // Filter <err> through the loop filter to find the correction ratio.
 160                 z1 += w0 * (w1 * err - z1);
 161                 z2 += w0 * (z1 - z2);
 162                 z3 += w2 * z2;
 163                 rcorr = 1.0 - z2 - z3;
 164                 if (rcorr > 1.05) rcorr = 1.05;
 165                 if (rcorr < 0.95) rcorr = 0.95;
 166                 assert(!isnan(rcorr));
 167                 vresampler.set_rratio(rcorr);
 168         }
 169
 170         // Finally actually resample, producing exactly <num_samples> output samples.
 171         vresampler.out_data = samples;
 172         vresampler.out_count = num_samples;
 173         while (vresampler.out_count > 0) {
 174                 if (buffer.empty()) {
 175                         // This should never happen unless delay is set way too low,
 176                         // or we're dropping a lot of data.
 177                         fprintf(stderr, "%s: PANIC: Out of input samples to resample, still need %d output samples! (correction factor is %f)\n",
 178                                 debug_description.c_str(), int(vresampler.out_count), rcorr);
 179                         memset(vresampler.out_data, 0, vresampler.out_count * num_channels * sizeof(float));
 180
 181                         // Reset the loop filter.
 182                         z1 = z2 = z3 = 0.0;
 183
 184                         return false;
 185                 }
 186
 187                 float inbuf[1024];
 188                 size_t num_input_samples = sizeof(inbuf) / (sizeof(float) * num_channels);
 189                 if (num_input_samples * num_channels > buffer.size()) {
 190                         num_input_samples = buffer.size() / num_channels;
 191                 }
 192                 copy(buffer.begin(), buffer.begin() + num_input_samples * num_channels, inbuf);
 193
 194                 vresampler.inp_count = num_input_samples;
 195                 vresampler.inp_data = inbuf;
 196
 197                 int err = vresampler.process();
 198                 assert(err == 0);
 199
 200                 size_t consumed_samples = num_input_samples - vresampler.inp_count;
 201                 total_consumed_samples += consumed_samples;
 202                 buffer.erase(buffer.begin(), buffer.begin() + consumed_samples * num_channels);
 203         }
 204         return true;
 205 }