HART/hart__max__cross__correlation_8hpp_source.html

#pragma once


#include <algorithm>  // min()

#include <cmath>  // abs()


#include "hart_accurate_sum.hpp"

#include "hart_audio_buffer.hpp"

#include "hart_exceptions.hpp"

#include "metrics/hart_metric_query.hpp"

#include "metrics/hart_metrics_common.hpp"  // CorrelationSearchMode, ChannelSubsets

#include "hart_slice.hpp"

#include "hart_units.hpp"                  // Unit

#include "hart_utils.hpp"                  // roundToSizeT()


namespace hart

{


/// @brief Calculates maximum normalized cross-correlation between two audio buffers
/// @details
/// Searches for the best normalized cross-correlation value within a specified
/// lag range independently for each selected pair of channels.
///
/// Cross-correlation is calculated using the following formula:
/// @f[
/// \frac{\sum_n x[n]\,y[n+k]}
///      {\sqrt{
///          \left(\sum_n x[n]^2\right)
///          \left(\sum_n y[n+k]^2\right)
///      }}
/// @f]
///
/// (`sum (x[n] * y[n + k]) / sqrt (sum (x[n]^2) * sum (y[n + k]^2))`)
///
/// where:
/// - `x[n]` is the left-hand-side signal
/// - `y[n + k]` is the right-hand-side signal shifted by lag `k`
/// - `k` is searched in the range `[-maxLag, +maxLag]`
/// - all sums run only over the frames where both signals overlap for the given lag
///
/// The result is normalized to the range `[-1, 1]`, where:
/// - `+1` means perfect positive correlation
/// - `-1` means perfect negative correlation (polarity inversion)
/// - `0` means no linear correlation
///
/// Depending on @p searchMode, the metric either:
/// - searches for the largest signed correlation value
/// - or searches for the largest absolute correlation value while still returning
///   the original signed correlation.
///
/// Lags are scanned from `-maxLag` to `+maxLag`; when several lags are equally good,
/// the first one encountered wins. The scan stops early once the best possible value
/// for the selected mode has been found (`+1` for `bestSignedCorrelation`,
/// `+1` or `-1` for `bestAbsoluteCorrelation`).
///
/// Correlation is calculated independently for each selected pair of channels.
/// Use a reducer to combine multiple channel-pair results into a scalar.
///
/// Usage examples:
/// @code
/// // Mono signals, default channel mapping {0,0}, default search mode (bestAbsoluteCorrelation)
/// const double corr = maxCrossCorrelation (monoInput, monoOutput, 100_ms).get();
///
/// // Same, with the default polarity-invariant search mode spelled out explicitly
/// const double corrAbs = maxCrossCorrelation (
///     monoInput,
///     monoOutput,
///     100_ms,
///     bestAbsoluteCorrelation
/// ).get();
///
/// // Stereo signals, strongest matched pair correlation
/// const double maxCorr = maxCrossCorrelation (stereoInput, stereoOutput, 100_ms).get (max());
///
/// // Cross-map channels explicitly
/// const double swappedCorr = maxCrossCorrelation (input, output, 100_ms)
///     .ch ({ {0, 1}, {1, 0} })
///     .get (min());
///
/// // Detect polarity inversion
/// const double corrSigned = maxCrossCorrelation (
///     input,
///     invertedOutput,
///     100_ms,
///     bestAbsoluteCorrelation
/// ).get();
///
/// HART_EXPECT_LT (corrSigned, 0.0);
/// @endcode
///
/// Notes:
/// - Gain differences do not affect the result due to normalization.
/// - DC offset may reduce correlation.
/// - Heavy non-linear processing may significantly reduce correlation.
/// - Returned value remains signed even in `bestAbsoluteCorrelation` mode.
/// - Lags for which either signal has (near-)zero energy inside the overlap are skipped.
/// - If no valid overlap exists (empty slice, or every lag was skipped), returns `NaN`.
/// - The lag in frames is derived from @p maxLagSeconds using the sample rate of @p bufferA,
///   and the requested slice is resolved against @p bufferA as well.
/// - The returned query refers to @p bufferA and @p bufferB by reference, so both buffers
///   must stay alive for as long as the query may be evaluated.
///
/// Supports only `Unit::native` and `Unit::none` units.
///
/// @param bufferA Left-hand-side audio buffer
/// @param bufferB Right-hand-side audio buffer
/// @param maxLagSeconds Maximum lag to search in seconds
/// @param searchMode Controls how the best lag is selected, see @ref CorrelationSearchMode
///
/// @return MetricQuery containing signed normalized cross-correlation values
///
/// @tparam SampleType Floating point sample type, typically `float` or `double`
///
/// @throws hart::ValueError If `maxLagSeconds` is negative
/// @throws hart::SampleRateError If sample rates differ
/// @throws hart::IndexError If requested channel indices are out of range
/// @throws hart::UnitError If unsupported unit is requested
///
/// @ingroup Metrics
template <typename SampleType>
MetricQuery<double> maxCrossCorrelation (
    const AudioBuffer<SampleType>& bufferA,
    const AudioBuffer<SampleType>& bufferB,
    double maxLagSeconds,
    CorrelationSearchMode searchMode = bestAbsoluteCorrelation
)
{
    if (maxLagSeconds < 0.0)
        HART_THROW_OR_RETURN (hart::ValueError,"Maximum lag must be non-negative", {});

    if ((bufferA.hasSampleRate() || bufferB.hasSampleRate()) && bufferA.getSampleRateHz() != bufferB.getSampleRateHz())
        HART_THROW_OR_RETURN (hart::SampleRateError, "Audio buffers must have equal sample rates", {});

    // The buffers are captured by reference: the evaluator is only valid while they are alive.
    typename MetricQuery<double>::ChannelPairMetricEvaluator evaluator =
        [&bufferA, &bufferB, maxLagSeconds, searchMode]
        (size_t channelA, size_t channelB, Slice slice, Unit requestedUnit)
        -> double
    {
        // Should be checked by MetricQuery
        hassert (channelA < bufferA.getNumChannels());
        hassert (channelB < bufferB.getNumChannels());

        if (requestedUnit != Unit::native && requestedUnit != Unit::none)
            HART_THROW_OR_RETURN (hart::UnitError, "Cross-correlation does not support requested unit", hart::nan<double>());

        if (slice.isEmpty())
            return hart::nan<double>();

        const auto sliceFrameIndices = bufferA.getFrameIndices (slice);
        const size_t sliceStart = sliceFrameIndices.first;
        const size_t sliceStop = sliceFrameIndices.second;
        hassert (sliceStop > sliceStart);
        hassert (sliceStop <= bufferA.getNumFrames());
        hassert (sliceStop <= bufferB.getNumFrames());

        const size_t numFrames = sliceStop - sliceStart;
        hassert (numFrames != 0);

        // A lag of numFrames or more leaves no overlapping frames, so the search range is
        // clamped to numFrames - 1. Clamping before rounding keeps the conversion to size_t
        // in range even for very large maxLagSeconds, and avoids iterating over lags that
        // could never contribute to the result.
        const double sampleRateHz = bufferA.getSampleRateHz();
        const double longestUsefulLag = static_cast<double> (numFrames - 1);
        const size_t maxLagFrames = roundToSizeT (std::min (maxLagSeconds * sampleRateHz, longestUsefulLag));

        const SampleType* x = bufferA[channelA] + sliceStart;
        const SampleType* y = bufferB[channelB] + sliceStart;

        const bool signedSearch = (searchMode == bestSignedCorrelation);
        double bestCorrelation = signedSearch ? -hart::inf : 0.0;
        bool hadValidOverlap = false;

        // A wide signed counter is used so that long slices cannot overflow the lag value.
        const long long lagLimit = static_cast<long long> (maxLagFrames);

        for (long long lag = -lagLimit; lag <= lagLimit; ++lag)
        {
            const bool lagIsNegative = lag < 0;
            const size_t lagAbsFrames = static_cast<size_t> (lagIsNegative ? -lag : lag);
            hassert (lagAbsFrames < numFrames);  // Guaranteed by the clamp above

            // Negative lag skips the head of x, positive lag skips the head of y
            const size_t xBegin = lagIsNegative ? lagAbsFrames : 0;
            const size_t yBegin = lagIsNegative ? 0 : lagAbsFrames;
            const size_t overlapFrames = numFrames - lagAbsFrames;

            AccurateSum<double> dotProduct;
            AccurateSum<double> sumSquaresX;
            AccurateSum<double> sumSquaresY;

            for (size_t frame = 0; frame < overlapFrames; ++frame)
            {
                const double xn = static_cast<double> (x[xBegin + frame]);
                const double yn = static_cast<double> (y[yBegin + frame]);

                dotProduct += xn * yn;
                sumSquaresX += xn * xn;
                sumSquaresY += yn * yn;
            }

            const double energyX = sumSquaresX.getValue();
            const double energyY = sumSquaresY.getValue();

            // Normalization is undefined for a silent overlap, skip this lag
            if (floatsEqual (energyX, 0.0) || floatsEqual (energyY, 0.0))
                continue;

            hadValidOverlap = true;
            const double correlation = dotProduct.getValue() / std::sqrt (energyX * energyY);

            if (signedSearch)
            {
                if (correlation > bestCorrelation)
                    bestCorrelation = correlation;
            }
            else  // bestAbsoluteCorrelation
            {
                if (std::abs (correlation) > std::abs (bestCorrelation))
                    bestCorrelation = correlation;
            }

            // Stop as soon as nothing better can be found. In signed mode only +1 is
            // unbeatable: a value of -1 must not end the search, since any later lag
            // may still yield a larger signed correlation.
            const bool reachedOptimum = signedSearch
                ? floatsEqual (bestCorrelation, 1.0)
                : floatsEqual (std::abs (bestCorrelation), 1.0);

            if (reachedOptimum)
                break;
        }

        if (! hadValidOverlap)
            return hart::nan<double>();

        return bestCorrelation;
    };

    // By default, channels are matched one-to-one: {0,0}, {1,1}, ...
    const size_t numPairs = std::min (bufferA.getNumChannels(), bufferB.getNumChannels());

    return MetricQuery<double> (
        std::move (evaluator),
        bufferA.getNumChannels(),
        bufferB.getNumChannels(),
        ChannelSubsets::diagonalChannelPairs (numPairs)
    );
}


}  // namespace hart

hart::AccurateSum
Implements Kahan algorithm for floating point accumulations.
Definition hart_accurate_sum.hpp:11

hart::AccurateSum::getValue
SampleType getValue() const
Definition hart_accurate_sum.hpp:55

hart::AccurateSum::operator+=
AccurateSum & operator+=(SampleType value)
Adds a value to a sum, tracking the potential floating point error.
Definition hart_accurate_sum.hpp:33

hart::AudioBuffer
Container for audio data.
Definition hart_audio_buffer.hpp:27

hart::MetricQuery
Manages the metrics calculations.
Definition hart_metric_query.hpp:43

hart::SampleRateError
Thrown when sample rate is mismatched.
Definition hart_exceptions.hpp:55

hart::UnitError
Thrown when some metric is requested to return a value in an unsupported unit.
Definition hart_exceptions.hpp:112

hart::ValueError
Thrown when an inappropriate value is encountered.
Definition hart_exceptions.hpp:47

hassert
#define hassert(condition)
Triggers a HartAssertException if the condition is false
Definition hart_exceptions.hpp:172

HART_THROW_OR_RETURN
#define HART_THROW_OR_RETURN(ExceptionType, message, returnValue)
Throws an exception if HART_DO_NOT_THROW_EXCEPTIONS is set, prints a message and returns a specified ...
Definition hart_exceptions.hpp:153

hart::maxCrossCorrelation
MetricQuery< double > maxCrossCorrelation(const AudioBuffer< SampleType > &bufferA, const AudioBuffer< SampleType > &bufferB, double maxLagSeconds, CorrelationSearchMode searchMode=bestAbsoluteCorrelation)
Calculates maximum normalized cross-correlation between two audio buffers.
Definition hart_max_cross_correlation.hpp:109

hart::nan
FloatType nan()
Returns a quiet NaN value for the given floating-point type.
Definition hart_utils.hpp:80

hart::roundToSizeT
static size_t roundToSizeT(SampleType x)
Rounds a floating point value to a size_t value.
Definition hart_utils.hpp:156

hart::inf
constexpr double inf
Infinity.
Definition hart_utils.hpp:23

hart::floatsEqual
static SampleType floatsEqual(SampleType a, SampleType b, SampleType epsilon=(SampleType) 1e-8)
Compares two floating point numbers within a given tolerance.
Definition hart_utils.hpp:142

hart
Definition hart_additive_noise.hpp:13

hart::CorrelationSearchMode
CorrelationSearchMode
Describes how to look for best cross-correlation.
Definition hart_metrics_common.hpp:108

hart::bestSignedCorrelation
@ bestSignedCorrelation
Definition hart_metrics_common.hpp:109

hart::bestAbsoluteCorrelation
@ bestAbsoluteCorrelation
Definition hart_metrics_common.hpp:110

hart::Unit
Unit
Represents a physical unit.
Definition hart_units.hpp:21

hart::Unit::none
@ none
Unitless value.

hart::Unit::native
@ native
Default (native) unit of whatever returns some value.

hart::ChannelSubsets
Helpers to generate common default channel subsets.
Definition hart_metrics_common.hpp:17

hart::ChannelSubsets::diagonalChannelPairs
static std::vector< std::pair< size_t, size_t > > diagonalChannelPairs(size_t numChannels)
Definition hart_metrics_common.hpp:40

hart::Slice
Represents a slice of analysis data.
Definition hart_slice.hpp:26

hart::Slice::isEmpty
bool isEmpty() const
Definition hart_slice.hpp:40