HART/hart__correlation__above_8hpp_source.html

#pragma once


#include <cmath>  // round()

#include <iomanip>

#include <vector>

#include <sstream>


#include "hart_accurate_sum.hpp"

#include "hart_exceptions.hpp"

#include "hart_matcher.hpp"

#include "hart_precision.hpp"

#include "hart_utils.hpp"                  // inf, floatsEqual()


namespace hart

{


/// @brief Checks whether the output signal is sufficiently correlated with the input signal
/// @details
/// Uses normalized cross-correlation in the time domain to compare input and output audio,
/// while searching for the best match within a configurable lag range.
/// Correlation is calculated independently for every applicable channel using the formula:
/// @f[
/// \frac{\sum_n x[n]\,y[n+k]}
///      {\sqrt{\left(\sum_n x[n]^2\right)\left(\sum_n y[n+k]^2\right)}}
/// @f]
///
/// (`sum (x[n] * y[n+k]) / sqrt (sum (x[n]^2) * sum (y[n+k]^2))`),
///
/// where `x` is input signal, `y` is observed output signal and `k` is the lag in frames.
/// Only the frames where the input and the lag-shifted output overlap take part in the sums.
///
/// For multi-channel audio, the lowest correlation value across all applicable channels is used.
/// This matcher is useful for verifying transparent DSP, latency compensation, bypass paths,
/// or processors that preserve waveform shape while introducing delay or mild coloration.
/// Notes:
/// - Gain differences do not affect the result due to normalization.
/// - Constant DC offset reduces correlation.
/// - Heavy nonlinear processing may significantly reduce correlation.
/// - The absolute value of correlation is used, so polarity inversions do not affect the result.
/// - Lags at which the input or the output overlap window has (near-)zero energy are skipped.
///   A channel for which every lag is skipped does not contribute to the result, and the match
///   fails if no channel could be evaluated at all.
/// @tparam SampleType Floating point sample type, typically `float` or `double`
/// @ingroup Matchers
/// @deprecated Use `hart::crossCorrelation()` metric instead
template <typename SampleType>
class
HART_DEPRECATED("Use hart::crossCorrelation() metric instead")
CorrelationAbove :
    public Matcher<SampleType, CorrelationAbove<SampleType>>
{
public:

    /// @brief Creates a correlation matcher with a minimum accepted correlation threshold
    /// @details The matcher scans lags in the range `[-maxLagSeconds, +maxLagSeconds]`
    /// and finds the best normalized cross-correlation value.
    /// A value of `1.0` requires a perfect waveform match (ignoring polarity and latency),
    /// while lower values allow progressively more waveform deviation.
    /// Both arguments are validated; an out-of-range value is reported as `hart::ValueError`
    /// through `HART_THROW_OR_RETURN`.
    /// @param minCorrelation Minimum allowed absolute correlation in the range `[0, 1]`
    /// @param maxLagSeconds Maximum absolute lag to search in seconds
    CorrelationAbove (double minCorrelation, double maxLagSeconds = 0.01):
        m_minCorrelation (minCorrelation),
        m_maxLagSeconds (maxLagSeconds)
    {
        // NOTE(review): HART_THROW_OR_RETURN is handed a return value (`false`) here, but a
        // constructor cannot return one. Confirm this still compiles when the macro is
        // configured to return instead of throw.
        if (m_minCorrelation < 0 || m_minCorrelation > 1.0)
            HART_THROW_OR_RETURN (hart::ValueError, "Correlation should be in 0..1 range", false);

        if (m_maxLagSeconds < 0)
            HART_THROW_OR_RETURN (hart::ValueError, "Max lag should be a non-negative number in seconds", false);
    }

    /// @brief Stores the sample rate and converts the maximum lag from seconds to frames
    /// @details The lag is rounded to the nearest whole frame.
    /// @param sampleRateHz Sample rate in Hz used for the seconds-to-frames conversion
    void prepare (double sampleRateHz, size_t /* numInputChannels */, size_t /* numOutputChannels */, size_t /*maxBlockSizeFrames*/) override
    {
        m_sampleRateHz = sampleRateHz;
        m_maxLagFrames = static_cast<long long int> (std::round (m_maxLagSeconds * m_sampleRateHz));
    }

    /// @brief Always returns `false` for this matcher
    bool canOperatePerBlock() const override
    {
        return false;
    }

    /// @brief Clears the results of the previous match (failure location, best correlation and lag)
    void reset() override
    {
        m_failureChannel = 0;
        m_failureFrame = 0;
        m_bestCorrelation = 0.0;
        m_bestLagFrames = 0;
        m_hadValidData = false;
    }

    /// @brief Accepts only layouts with the same number of input and output channels
    bool supportsChannelLayout (size_t numInputChannels, size_t numOutputChannels) const override
    {
        return numInputChannels == numOutputChannels;
    }

    /// @brief Computes the best lag-compensated correlation per channel and compares the worst one with the threshold
    /// @details For every applicable channel, all lags in `[-maxLag, +maxLag]` (in frames) are
    /// tried and the highest absolute normalized correlation is kept. The channel with the
    /// lowest such value decides the outcome, and its correlation and lag are remembered for
    /// getFailureDetails().
    /// @param context Analysis context providing the input audio and the observed output audio
    /// @return `true` if at least one channel could be evaluated and the lowest per-channel
    /// correlation is not below the threshold passed to the constructor, `false` otherwise
    /// (including empty audio)
    bool match (AnalysisContext<SampleType> context) override
    {
        const AudioBuffer<SampleType>& inputAudio = context.inputAudio();
        const AudioBuffer<SampleType>& observedOutputAudio = context.outputAudio();

        hassert (inputAudio.getNumChannels() == observedOutputAudio.getNumChannels());
        hassert (inputAudio.getNumFrames() == observedOutputAudio.getNumFrames());
        hassert (inputAudio.getSampleRateHz() == observedOutputAudio.getSampleRateHz());

        const size_t numChannels = inputAudio.getNumChannels();
        const size_t numFrames = inputAudio.getNumFrames();

        if (numFrames == 0)
        {
            // Clear the failure location as well, so that details from an earlier match are not reported
            m_hadValidData = false;
            m_failureChannel = 0;
            m_failureFrame = 0;
            return false;
        }

        // A lag of numFrames or more leaves no overlapping frames, so there is no point in
        // iterating past +/-(numFrames - 1) even if the configured lag range is wider.
        const long long int maxOverlappingLagFrames = static_cast<long long int> (numFrames - 1);
        const long long int lagLimitFrames = m_maxLagFrames < maxOverlappingLagFrames
            ? m_maxLagFrames
            : maxOverlappingLagFrames;

        // Prefix sums of squared samples: element [i] holds the energy of frames [0, i).
        // Allocated once and overwritten for every channel; element [0] always stays 0.
        std::vector<double> prefixSumsSqX (numFrames + 1, 0.0);
        std::vector<double> prefixSumsSqY (numFrames + 1, 0.0);

        double worstChannelCorrelation = hart::inf;
        size_t worstChannel = 0;
        bool anyValidChannel = false;

        for (size_t channel = 0; channel < numChannels; ++channel)
        {
            if (! this->appliesToChannel (channel))
                continue;

            double bestCorrelation = -hart::inf;
            long long int bestLag = 0;
            bool channelValid = false;

            const SampleType* x = inputAudio[channel];
            const SampleType* y = observedOutputAudio[channel];
            AccurateSum<double> runningSumSqX { 0.0 };
            AccurateSum<double> runningSumSqY { 0.0 };

            for (size_t frame = 0; frame < numFrames; ++frame)
            {
                const double xVal = static_cast<double> (x[frame]);
                const double yVal = static_cast<double> (y[frame]);

                runningSumSqX += xVal * xVal;
                runningSumSqY += yVal * yVal;
                prefixSumsSqX[frame + 1] = runningSumSqX;
                prefixSumsSqY[frame + 1] = runningSumSqY;
            }

            // Formula:
            // sum (x[n] * y[n+k]) / sqrt (sum (x[n]^2) * sum (y[n+k]^2))

            for (long long int lag = -lagLimitFrames; lag <= lagLimitFrames; ++lag)
            {
                const bool lagShiftsOutputToTheLeft = lag < 0;
                const size_t lagAbsFrames = static_cast<size_t> (lagShiftsOutputToTheLeft ? -lag : lag);

                // For a given lag, correlate only the valid overlap interval:
                // x[inputOverlapBeginFrame + offset] with y[outputOverlapBeginFrame + offset].
                const size_t inputOverlapBeginFrame = lagShiftsOutputToTheLeft ? lagAbsFrames : 0;
                const size_t outputOverlapBeginFrame = lagShiftsOutputToTheLeft ? 0 : lagAbsFrames;
                const size_t overlapSizeFrames = numFrames - lagAbsFrames;
                const size_t inputOverlapEndFrame = inputOverlapBeginFrame + overlapSizeFrames;
                const size_t outputOverlapEndFrame = outputOverlapBeginFrame + overlapSizeFrames;
                const double sumSqX = prefixSumsSqX[inputOverlapEndFrame] - prefixSumsSqX[inputOverlapBeginFrame];
                const double sumSqY = prefixSumsSqY[outputOverlapEndFrame] - prefixSumsSqY[outputOverlapBeginFrame];

                // Correlation is undefined when either window carries no energy. Check this
                // before the dot product, so that the O(overlap) loop below is not run in vain.
                if (floatsEqual (sumSqX, 0.0) || floatsEqual (sumSqY, 0.0))
                    continue;

                AccurateSum<double> dotProduct { 0.0 };

                for (size_t overlapFrame = 0; overlapFrame < overlapSizeFrames; ++overlapFrame)
                {
                    const double xnValue = static_cast<double> (x[inputOverlapBeginFrame + overlapFrame]);
                    const double ynValue = static_cast<double> (y[outputOverlapBeginFrame + overlapFrame]);
                    dotProduct += xnValue * ynValue;
                }

                channelValid = true;
                const double corr = dotProduct / std::sqrt (sumSqX * sumSqY);
                const double absCorr = std::abs (corr);

                if (absCorr > bestCorrelation)
                {
                    bestCorrelation = absCorr;
                    bestLag = lag;
                }

                // A (practically) perfect match cannot be improved upon, stop scanning lags
                if (floatsEqual (absCorr, 1.0))
                {
                    bestCorrelation = absCorr;
                    bestLag = lag;
                    break;
                }
            }

            // No lag produced a window with energy on both sides, nothing to judge this channel by
            if (! channelValid)
                continue;

            anyValidChannel = true;

            if (bestCorrelation < worstChannelCorrelation)
            {
                worstChannelCorrelation = bestCorrelation;
                worstChannel = channel;
                m_bestCorrelation = bestCorrelation;
                m_bestLagFrames = bestLag;
            }
        }

        if (! anyValidChannel)
        {
            m_hadValidData = false;
            m_failureChannel = 0;
            m_failureFrame = 0;
            return false;
        }

        m_hadValidData = true;

        if (worstChannelCorrelation >= m_minCorrelation)
            return true;

        m_failureChannel = worstChannel;
        m_failureFrame = 0; // no specific frame failure

        return false;
    }

    /// @brief Describes the outcome of the last match() call
    /// @return Details holding the worst channel, frame 0, and either the best correlation
    /// with its lag (in frames and seconds) for that channel, or a note that correlation
    /// could not be computed
    MatcherFailureDetails getFailureDetails() const override
    {
        MatcherFailureDetails details;
        details.channel = m_failureChannel;
        details.frame = m_failureFrame;

        if (! m_hadValidData)
        {
            details.description = "Correlation could not be computed (no valid signal overlap)";
            return details;
        }

        // A zero-frame lag is zero seconds at any sample rate. Handling it without a division
        // avoids 0 / 0 (NaN) in case the sample rate has not been set to a non-zero value.
        const double lagSeconds = m_bestLagFrames == 0
            ? 0.0
            : m_bestLagFrames / m_sampleRateHz;

        std::stringstream stream;

        stream
            << "Best correlation: " << correlationPrecision << m_bestCorrelation
            << " at lag " << m_bestLagFrames << " frames ("
            << secPrecision << lagSeconds << " seconds)";

        details.description = stream.str();
        return details;
    }

    /// @brief Writes a textual representation of this matcher, including its constructor arguments
    /// @param stream Output stream to write to
    void represent (std::ostream& stream) const override
    {
        stream
            << "CorrelationAbove ("
            << correlationPrecision << m_minCorrelation << ", "
            << secPrecision << m_maxLagSeconds << "_s)";
    }

private:
    const double m_minCorrelation;  // Lowest accepted absolute correlation
    const double m_maxLagSeconds;   // Half-width of the lag search range, in seconds

    double m_sampleRateHz = 0.0;        // Set by prepare()
    long long int m_maxLagFrames = 0;   // m_maxLagSeconds converted to frames by prepare()

    double m_bestCorrelation = 0.0;     // Best correlation of the worst channel in the last match()
    long long int m_bestLagFrames = 0;  // Lag at which m_bestCorrelation was found, in frames

    size_t m_failureChannel = 0;
    size_t m_failureFrame = 0;
    bool m_hadValidData = false;        // False if the last match() could not evaluate any channel
};


// Declares the matcher aliases for CorrelationAbove through the project's alias macro.
// NOTE(review): the macro is defined outside this file (hart_matcher.hpp), so the exact
// alias names it generates are not visible here.
HART_MATCHER_DECLARE_ALIASES_FOR (CorrelationAbove)


} // namespace hart

hart::AccurateSum
Implements Kahan algorithm for floating point accumulations.
Definition hart_accurate_sum.hpp:11

hart::AccurateSum::AccurateSum
AccurateSum(SampleType initialSum=(SampleType) 0)
Inits AccurateSum with a specific value.
Definition hart_accurate_sum.hpp:15

hart::AccurateSum::operator+=
AccurateSum & operator+=(SampleType value)
Adds a value to a sum, tracking the potential floating point error.
Definition hart_accurate_sum.hpp:33

hart::AnalysisContext
Contains audio-related artefacts useful for analysis by matchers.
Definition hart_analysis_context.hpp:23

hart::AudioBuffer
Container for audio data.
Definition hart_audio_buffer.hpp:27

hart::Matcher
Base for audio matchers.
Definition hart_matcher.hpp:189

hart::ValueError
Thrown when an inappropriate value is encountered.
Definition hart_exceptions.hpp:47

hassert
#define hassert(condition)
Triggers a HartAssertException if the condition is false
Definition hart_exceptions.hpp:172

HART_THROW_OR_RETURN
#define HART_THROW_OR_RETURN(ExceptionType, message, returnValue)
Throws an exception if HART_DO_NOT_THROW_EXCEPTIONS is set, prints a message and returns a specified ...
Definition hart_exceptions.hpp:153

hart::secPrecision
std::ostream & secPrecision(std::ostream &stream)
Sets number of decimal places for values in seconds.
Definition hart_precision.hpp:34

hart::correlationPrecision
static std::ostream & correlationPrecision(std::ostream &stream)
Sets number of decimal places for correlation values.
Definition hart_precision.hpp:65

HART_DEPRECATED
#define HART_DEPRECATED(msg)
Definition hart_utils.hpp:248

hart::inf
constexpr double inf
Infinity.
Definition hart_utils.hpp:23

hart::floatsEqual
static SampleType floatsEqual(SampleType a, SampleType b, SampleType epsilon=(SampleType) 1e-8)
Compares two floating point numbers within a given tolerance.
Definition hart_utils.hpp:142

HART_MATCHER_DECLARE_ALIASES_FOR
#define HART_MATCHER_DECLARE_ALIASES_FOR(ClassName)
Definition hart_matcher.hpp:361

hart
Definition hart_additive_noise.hpp:13

hart::MatcherFailureDetails
Details about matcher failure.
Definition hart_matcher_failure_details.hpp:14

hart::MatcherFailureDetails::channel
size_t channel
Index of channel at which the failure was detected.
Definition hart_matcher_failure_details.hpp:16

hart::MatcherFailureDetails::description
std::string description
Readable description of why the match has failed.
Definition hart_matcher_failure_details.hpp:17

hart::MatcherFailureDetails::frame
size_t frame
Index of frame at which the match has failed.
Definition hart_matcher_failure_details.hpp:15