Add normaliser

2024-12-18 17:11:53 +00:00 · 2023-06-21 20:48:02 -05:00 · 2023-06-21 20:48:02 -05:00 · 375f83797a
commit 375f83797a
parent 3b64f25286
2 changed files with 354 additions and 0 deletions
--- a/playback/src/lib.rs
+++ b/playback/src/lib.rs
@ -11,12 +11,23 @@ pub mod convert;
 pub mod decoder;
 pub mod dither;
 pub mod mixer;
+pub mod normaliser;
 pub mod player;
 pub mod resampler;

+pub const DB_VOLTAGE_RATIO: f64 = 20.0;
+pub const PCM_AT_0DBFS: f64 = 1.0;
 pub const RESAMPLER_INPUT_SIZE: usize = 147;
 pub const SAMPLE_RATE: u32 = 44100;
 pub const NUM_CHANNELS: u8 = 2;
 pub const SAMPLES_PER_SECOND: u32 = SAMPLE_RATE * NUM_CHANNELS as u32;
 pub const PAGES_PER_MS: f64 = SAMPLE_RATE as f64 / 1000.0;
 pub const MS_PER_PAGE: f64 = 1000.0 / SAMPLE_RATE as f64;
+
+pub fn db_to_ratio(db: f64) -> f64 {
+    f64::powf(10.0, db / DB_VOLTAGE_RATIO)
+}
+
+pub fn ratio_to_db(ratio: f64) -> f64 {
+    ratio.log10() * DB_VOLTAGE_RATIO
+}
--- a/playback/src/normaliser.rs
+++ b/playback/src/normaliser.rs
@ -0,0 +1,343 @@
+use crate::{
+    config::{NormalisationMethod, NormalisationType, PlayerConfig},
+    db_to_ratio,
+    decoder::AudioPacket,
+    mixer::VolumeGetter,
+    player::NormalisationData,
+    ratio_to_db, PCM_AT_0DBFS,
+};
+
+struct NoNormalisation;
+
+impl NoNormalisation {
+    fn normalise(samples: &[f64], volume: f64) -> Vec<f64> {
+        if volume < 1.0 {
+            let mut output = Vec::with_capacity(samples.len());
+
+            output.extend(samples.iter().map(|sample| sample * volume));
+
+            output
+        } else {
+            samples.to_vec()
+        }
+    }
+}
+
+struct BasicNormalisation;
+
+impl BasicNormalisation {
+    fn normalise(samples: &[f64], volume: f64, factor: f64) -> Vec<f64> {
+        if volume < 1.0 || factor < 1.0 {
+            let mut output = Vec::with_capacity(samples.len());
+
+            output.extend(samples.iter().map(|sample| sample * factor * volume));
+
+            output
+        } else {
+            samples.to_vec()
+        }
+    }
+}
+
+#[derive(PartialEq)]
+struct DynamicNormalisation {
+    threshold_db: f64,
+    attack_cf: f64,
+    release_cf: f64,
+    knee_db: f64,
+    integrator: f64,
+    peak: f64,
+}
+
+impl DynamicNormalisation {
+    fn new(config: &PlayerConfig) -> Self {
+        // as_millis() has rounding errors (truncates)
+        debug!(
+            "Normalisation Attack: {:.0} ms",
+            config
+                .sample_rate
+                .normalisation_coefficient_to_duration(config.normalisation_attack_cf)
+                .as_secs_f64()
+                * 1000.
+        );
+
+        debug!(
+            "Normalisation Release: {:.0} ms",
+            config
+                .sample_rate
+                .normalisation_coefficient_to_duration(config.normalisation_release_cf)
+                .as_secs_f64()
+                * 1000.
+        );
+
+        Self {
+            threshold_db: config.normalisation_threshold_dbfs,
+            attack_cf: config.normalisation_attack_cf,
+            release_cf: config.normalisation_release_cf,
+            knee_db: config.normalisation_knee_db,
+            integrator: 0.0,
+            peak: 0.0,
+        }
+    }
+
+    fn stop(&mut self) {
+        self.integrator = 0.0;
+        self.peak = 0.0;
+    }
+
+    fn normalise(&mut self, samples: &[f64], volume: f64, factor: f64) -> Vec<f64> {
+        let mut output = Vec::with_capacity(samples.len());
+
+        output.extend(samples.iter().map(|sample| {
+            let mut sample = sample * factor;
+
+            // Feedforward limiter in the log domain
+            // After: Giannoulis, D., Massberg, M., & Reiss, J.D. (2012). Digital Dynamic
+            // Range Compressor Design—A Tutorial and Analysis. Journal of The Audio
+            // Engineering Society, 60, 399-408.
+
+            // Some tracks have samples that are precisely 0.0. That's silence
+            // and we know we don't need to limit that, in which we can spare
+            // the CPU cycles.
+            //
+            // Also, calling `ratio_to_db(0.0)` returns `inf` and would get the
+            // peak detector stuck. Also catch the unlikely case where a sample
+            // is decoded as `NaN` or some other non-normal value.
+            let limiter_db = if sample.is_normal() {
+                // step 1-4: half-wave rectification and conversion into dB
+                // and gain computer with soft knee and subtractor
+                let bias_db = ratio_to_db(sample.abs()) - self.threshold_db;
+                let knee_boundary_db = bias_db * 2.0;
+
+                if knee_boundary_db < -self.knee_db {
+                    0.0
+                } else if knee_boundary_db.abs() <= self.knee_db {
+                    // The textbook equation:
+                    // ratio_to_db(sample.abs()) - (ratio_to_db(sample.abs()) - (bias_db + knee_db / 2.0).powi(2) / (2.0 * knee_db))
+                    // Simplifies to:
+                    // ((2.0 * bias_db) + knee_db).powi(2) / (8.0 * knee_db)
+                    // Which in our case further simplifies to:
+                    // (knee_boundary_db + knee_db).powi(2) / (8.0 * knee_db)
+                    // because knee_boundary_db is 2.0 * bias_db.
+                    (knee_boundary_db + self.knee_db).powi(2) / (8.0 * self.knee_db)
+                } else {
+                    // Textbook:
+                    // ratio_to_db(sample.abs()) - threshold_db, which is already our bias_db.
+                    bias_db
+                }
+            } else {
+                0.0
+            };
+
+            // Spare the CPU unless (1) the limiter is engaged, (2) we
+            // were in attack or (3) we were in release, and that attack/
+            // release wasn't finished yet.
+            if limiter_db > 0.0 || self.integrator > 0.0 || self.peak > 0.0 {
+                // step 5: smooth, decoupled peak detector
+                // Textbook:
+                // release_cf * integrator + (1.0 - release_cf) * limiter_db
+                // Simplifies to:
+                // release_cf * integrator - release_cf * limiter_db + limiter_db
+                self.integrator = limiter_db.max(
+                    self.release_cf * self.integrator - self.release_cf * limiter_db + limiter_db,
+                );
+                // Textbook:
+                // attack_cf * peak + (1.0 - attack_cf) * integrator
+                // Simplifies to:
+                // attack_cf * peak - attack_cf * integrator + integrator
+                self.peak =
+                    self.attack_cf * self.peak - self.attack_cf * self.integrator + self.integrator;
+
+                // step 6: make-up gain applied later (volume attenuation)
+                // Applying the standard normalisation factor here won't work,
+                // because there are tracks with peaks as high as 6 dB above
+                // the default threshold, so that would clip.
+
+                // steps 7-8: conversion into level and multiplication into gain stage
+                sample *= db_to_ratio(-self.peak);
+            }
+
+            sample * volume
+        }));
+
+        output
+    }
+}
+
+#[derive(PartialEq)]
+enum Normalisation {
+    None,
+    Basic,
+    Dynamic(DynamicNormalisation),
+}
+
+impl Normalisation {
+    fn new(config: &PlayerConfig) -> Self {
+        if !config.normalisation {
+            Normalisation::None
+        } else {
+            debug!("Normalisation Type: {:?}", config.normalisation_type);
+            debug!(
+                "Normalisation Pregain: {:.1} dB",
+                config.normalisation_pregain_db
+            );
+
+            debug!(
+                "Normalisation Threshold: {:.1} dBFS",
+                config.normalisation_threshold_dbfs
+            );
+
+            debug!("Normalisation Method: {:?}", config.normalisation_method);
+
+            match config.normalisation_method {
+                NormalisationMethod::Dynamic => {
+                    Normalisation::Dynamic(DynamicNormalisation::new(config))
+                }
+                NormalisationMethod::Basic => Normalisation::Basic,
+            }
+        }
+    }
+
+    fn stop(&mut self) {
+        if let Normalisation::Dynamic(ref mut d) = self {
+            d.stop()
+        }
+    }
+
+    fn normalise(&mut self, samples: &[f64], volume: f64, factor: f64) -> Vec<f64> {
+        use Normalisation::*;
+
+        match self {
+            None => NoNormalisation::normalise(samples, volume),
+            Basic => BasicNormalisation::normalise(samples, volume, factor),
+            Dynamic(ref mut d) => d.normalise(samples, volume, factor),
+        }
+    }
+}
+
+pub struct Normaliser {
+    normalisation: Normalisation,
+    volume_getter: Box<dyn VolumeGetter>,
+    normalisation_type: NormalisationType,
+    pregain_db: f64,
+    threshold_dbfs: f64,
+    factor: f64,
+}
+
+impl Normaliser {
+    pub fn new(config: &PlayerConfig, volume_getter: Box<dyn VolumeGetter>) -> Self {
+        Self {
+            normalisation: Normalisation::new(config),
+            volume_getter,
+            normalisation_type: config.normalisation_type,
+            pregain_db: config.normalisation_pregain_db,
+            threshold_dbfs: config.normalisation_threshold_dbfs,
+            factor: 1.0,
+        }
+    }
+
+    pub fn normalise(&mut self, samples: &[f64]) -> AudioPacket {
+        let volume = self.volume_getter.attenuation_factor();
+
+        AudioPacket::Samples(self.normalisation.normalise(samples, volume, self.factor))
+    }
+
+    pub fn stop(&mut self) {
+        self.normalisation.stop();
+    }
+
+    pub fn set_factor(&mut self, auto_normalise_as_album: bool, data: NormalisationData) {
+        if self.normalisation != Normalisation::None {
+            self.factor = self.get_factor(auto_normalise_as_album, data);
+        }
+    }
+
+    fn get_factor(&self, auto_normalise_as_album: bool, data: NormalisationData) -> f64 {
+        let (gain_db, gain_peak, norm_type) = match self.normalisation_type {
+            NormalisationType::Album => (
+                data.album_gain_db,
+                data.album_peak,
+                NormalisationType::Album,
+            ),
+            NormalisationType::Track => (
+                data.track_gain_db,
+                data.track_peak,
+                NormalisationType::Track,
+            ),
+            NormalisationType::Auto => {
+                if auto_normalise_as_album {
+                    (
+                        data.album_gain_db,
+                        data.album_peak,
+                        NormalisationType::Album,
+                    )
+                } else {
+                    (
+                        data.track_gain_db,
+                        data.track_peak,
+                        NormalisationType::Track,
+                    )
+                }
+            }
+        };
+
+        // As per the ReplayGain 1.0 & 2.0 (proposed) spec:
+        // https://wiki.hydrogenaud.io/index.php?title=ReplayGain_1.0_specification#Clipping_prevention
+        // https://wiki.hydrogenaud.io/index.php?title=ReplayGain_2.0_specification#Clipping_prevention
+        let normalisation_factor = if self.normalisation == Normalisation::Basic {
+            // For Basic Normalisation, factor = min(ratio of (ReplayGain + PreGain), 1.0 / peak level).
+            // https://wiki.hydrogenaud.io/index.php?title=ReplayGain_1.0_specification#Peak_amplitude
+            // https://wiki.hydrogenaud.io/index.php?title=ReplayGain_2.0_specification#Peak_amplitude
+            // We then limit that to 1.0 as not to exceed dBFS (0.0 dB).
+            let factor = f64::min(
+                db_to_ratio(gain_db + self.pregain_db),
+                PCM_AT_0DBFS / gain_peak,
+            );
+
+            if factor > PCM_AT_0DBFS {
+                info!(
+                    "Lowering gain by {:.2} dB for the duration of this track to avoid potentially exceeding dBFS.",
+                    ratio_to_db(factor)
+                );
+
+                PCM_AT_0DBFS
+            } else {
+                factor
+            }
+        } else {
+            // For Dynamic Normalisation it's up to the player to decide,
+            // factor = ratio of (ReplayGain + PreGain).
+            // We then let the dynamic limiter handle gain reduction.
+            let factor = db_to_ratio(gain_db + self.pregain_db);
+            let threshold_ratio = db_to_ratio(self.threshold_dbfs);
+
+            if factor > PCM_AT_0DBFS {
+                let factor_db = gain_db + self.pregain_db;
+                let limiting_db = factor_db + self.threshold_dbfs.abs();
+
+                warn!(
+                    "This track may exceed dBFS by {:.2} dB and be subject to {:.2} dB of dynamic limiting at it's peak.",
+                    factor_db, limiting_db
+                );
+            } else if factor > threshold_ratio {
+                let limiting_db = gain_db + self.pregain_db + self.threshold_dbfs.abs();
+
+                info!(
+                    "This track may be subject to {:.2} dB of dynamic limiting at it's peak.",
+                    limiting_db
+                );
+            }
+
+            factor
+        };
+
+        debug!("Normalisation Data: {:?}", data);
+        debug!(
+            "Calculated Normalisation Factor for {:?}: {:.2}%",
+            norm_type,
+            normalisation_factor * 100.0
+        );
+
+        normalisation_factor
+    }
+}