VAE-Docs/vae__spatial__processor_8hpp_source.html

#ifndef _VAE_SPATIAL_PROCESSOR

#define _VAE_SPATIAL_PROCESSOR


#include "../vae_types.hpp"

#include "../vae_util.hpp"

#include "../pod/vae_bank.hpp"

#include "../voices/vae_voice.hpp"

#include "../voices/vae_voice_filter.hpp"

#include "../voices/vae_voice_pan.hpp"

#include "../voices/vae_voice_hrtf.hpp"

#include "../vae_voice_manager.hpp"

#include "../vae_spatial_manager.hpp"

#include "../algo/vae_spcap.hpp"

#include "../algo/vae_hrtf_util.hpp"


#include "../fs/vae_hrtf_loader.hpp"

#include "../../../external/glm/glm/gtc/matrix_transform.hpp"


namespace vae { namespace core {

    /**
     * @brief Renders the spatialized voices of a bank into the bank's mixers.
     *
     * For every spatialized voice the processor computes the emitter direction
     * relative to the listener, applies optional distance attenuation,
     * optionally resamples/filters/loops the mono source signal and finally
     * pans it either with the loaded HRTF or with one of the SPCAP panners.
     */
    class SpatialProcessor {
        HRTF mHRTF;                             ///< Currently loaded HRTF, there can only be one
        HRTFLoader mHRTFLoader;                 ///< Struct to decode the hrtf
        HeapBuffer<VoiceHRTF> mVoiceHRTFs;      ///< Working data for convolution, indexed by voice index

        /**
         * @brief Temporary filtered/looped signal, sized to StaticConfig::MaxBlock in init().
         * TODO this will not work with parallel bank processing
         */
        ScratchBuffer mScratchBuffer;

    public:
        /**
         * @brief Allocates the per voice HRTF working data and the scratch buffer.
         *
         * @param hrtfVoices Number of VoiceHRTF slots to allocate
         * @return Always Result::Success
         */
        Result init(Size hrtfVoices) {
            VAE_PROFILER_SCOPE_NAMED("Spatial Processor Init")
            // NOTE(review): the results of both resize calls are ignored, so an
            // allocation failure would go unnoticed here - confirm this is intended.
            mVoiceHRTFs.resize(hrtfVoices);
            mScratchBuffer.resize(StaticConfig::MaxBlock);
            return Result::Success;
        }

        /**
         * @brief Process the spatialized voices of a single bank
         *
         * Voices which belong to another bank or are not spatialized are skipped.
         * The voice callback returns false to stop a voice (missing emitter,
         * empty signal or a non looping signal reached its end).
         *
         * @param manager Voice pool which is iterated, also provides filter and pan state per voice
         * @param bank Bank providing the sources and the mixers which are rendered to
         * @param spatial Provides the emitters and listeners
         * @param frames Number of samples to render; the scratch buffer only holds StaticConfig::MaxBlock samples
         * @param sampleRate Output sample rate, sources with a different rate are resampled
         * @return Number of voices mixed
         */
        Size mix(
            VoiceManger& manager, Bank& bank,
            SpatialManager& spatial,
            SampleIndex frames, Size sampleRate
        ) {
            Size actuallyRendered = 0;
            VAE_PROFILER_SCOPE_NAMED("Spatial Processor")
            manager.forEachVoice([&](Voice& v, Size vi) {
                if (v.bank != bank.id) { return true; }     // wrong bank
                if (!v.spatialized) { return true; }        // not spatialized
                VAE_PROFILER_SCOPE_NAMED("Spatial Voice")
                if (!spatial.hasEmitter(v.emitter)) {
                    VAE_DEBUG("Spatial voice is missing emitter")
                    return false; // ! needs emitter
                }

                auto& source = bank.sources[v.source];
                auto& signal = source.signal;
                const auto signalLength = signal.size();

                if (signalLength == 0) { return false; }    // ! no signal

                v.time = v.time % signalLength;     // Keep signal in bounds before starting

                if (signal.sampleRate != sampleRate) {
                    // VAE_DEBUG("Spatial Voice samplerate mismatch. Enabled filter.")
                    v.filtered = true; // implicitly filter to resample
                }

                auto& emitter = spatial.getEmitter(v.emitter);
                auto& target = bank.mixers[v.mixer].buffer;
                const Sample gain = v.gain * source.gain;
                auto& l = spatial.getListeners()[v.listener];

                Real distanceAttenuated;    // final volume: distance attenuation times gain
                Vec3 relativeDirection;     // normalized direction of the emitter seen from the listener

                // * Attenuation calculation
                {
                    VAE_PROFILER_SCOPE_NAMED("Attenuation calculation")
                    // same thing as in graphics, make the world rotate around the listener
                    // TODO this should be possible without a 4x4 matrix?
                    glm::mat4x4 lookAt = glm::lookAt(l.position, l.position + l.front, l.up);
                    // listener is the world origin now
                    relativeDirection = (lookAt * glm::vec4(emitter.position, 1.f));

                    // lower bound keeps the normalization below away from a division by zero
                    const Real distance = std::max(glm::length(relativeDirection), 0.1f);
                    relativeDirection /= distance;

                    // we don't want to get louder than 1, so distances below 1 don't amplify
                    distanceAttenuated = v.attenuate
                        ? Real(1) / std::max(distance, Real(1))
                        : Real(1);
                    distanceAttenuated *= gain;
                }

                if (distanceAttenuated < StaticConfig::MinVolume) {
                    return true; // ! inaudible
                    // TODO maybe still progress time?
                }

                actuallyRendered++;
                target.setValidSize(frames); // mark target mixer as active
                v.audible = true;

                // * Filtering and looping logic

                // TODO This thing is littered with branches, maybe needs some cleanup

                const Sample* in;               // The filtered, looped original signal used for panning later. We only do mono signals
                SampleIndex remaining = frames; // playback speed and looping affects this
                bool finished = false;          // the return value of this function stops the voice

                if (v.filtered) {
                    VAE_PROFILER_SCOPE_NAMED("Voice Filter")
                    VAE_ASSERT(frames <= StaticConfig::MaxBlock) // scratch buffer holds MaxBlock samples
                    auto& fd = manager.getVoiceFilter(vi);

                    if (!v.started) {
                        // Initialize filter variables when first playing the voice
                        fd.highpassScratch[0]   = 0;
                        fd.lowpassScratch[0]    = signal[0][v.time];
                    }

                    // Playback speed taking samplerate into account
                    const Sample speed = fd.speed * (Sample(signal.sampleRate) / Sample(sampleRate));

                    if (!v.loop) {
                        // If we're not looping, end time calculation is a bit more complex
                        const Real playable = std::floor((signalLength - v.time) / speed - fd.timeFract);
                        // Clamp in floating point before converting: a negative or
                        // non finite value must never be cast to an unsigned index
                        if (!(playable < Real(frames))) {
                            remaining = frames;
                        } else if (playable > Real(0)) {
                            remaining = SampleIndex(playable);
                        } else {
                            remaining = 0;
                        }
                        finished = remaining != frames; // we might have reached the end
                    }

                    // fractional time, we need the value after the loop, so it's defined outside
                    // and initialized so an empty block leaves the playback position untouched
                    Real position = v.time + fd.timeFract;
                    // Always renders the whole block, indices wrap around the signal
                    // so reading beyond the end is safe. Only 'remaining' samples are panned.
                    for (SampleIndex s = 0; s < frames; s++) {
                        // Linear interpolation between two samples
                        position = v.time + (s * speed) + fd.timeFract;
                        const Real lastPosition = std::floor(position);
                        const Size lastIndex = Size(lastPosition);
                        const Size nextIndex = lastIndex + 1;

                        const Real blend = position - lastPosition;
                        // blend = 0.5 * (1.0 - cos((blend) * 3.1416)); // cosine interpolation, introduces new harmonics somehow

                        // TODO 30% of the time in here is spent on the modulo
                        const Sample last = signal[0][lastIndex % signalLength];
                        const Sample next = signal[0][nextIndex % signalLength];
                        // linear resampling, sounds alright enough
                        // The gain is not applied here, it's already part of
                        // distanceAttenuated which scales the signal when panning.
                        // Applying it here as well would square the gain for filtered voices.
                        const Sample resampled = last + blend * (next - last);

                        //  * super simple lowpass and highpass filter
                        // just lerps with a previous value
                        const Sample lpd = resampled + fd.lowpass * (fd.lowpassScratch[0] - resampled);
                        fd.lowpassScratch[0] = lpd;

                        const Sample hps = fd.highpassScratch[0];
                        const Sample hpd = hps + fd.highpass * (resampled - hps);
                        fd.highpassScratch[0] = hpd;

                        mScratchBuffer[0][s] = (lpd - hpd);
                    }
                    if (frames > 0) {
                        position += speed;              // step to next sample
                    }
                    v.time = SampleIndex(std::floor(position)); // split the signal in normal sample position
                    fd.timeFract = position - v.time;   // and fractional time for the next block
                    in = mScratchBuffer[0];             // set the buffer to use for panning
                } else {
                    VAE_PROFILER_SCOPE_NAMED("Non filtered Voice")
                    if (v.loop) {
                        VAE_ASSERT(frames <= StaticConfig::MaxBlock) // scratch buffer holds MaxBlock samples
                        // put the looped signal in scratch buffer even though we're not filtering
                        // so panning doesn't need to worry about looping
                        for (SampleIndex s = 0; s < frames; s++) {
                            mScratchBuffer[0][s] = signal[0][(v.time + s) % signalLength];
                        }
                        v.time = (v.time + frames); // progress the time, wrapped at the start of the next block
                        in = mScratchBuffer[0];     // set buffer for panning
                        finished = false;           // never stop the voice
                    } else {
                        // Not filtering or looping
                        // Means we can use the original signal buffer but need to
                        // set the remaining samples so we don't run over the signal end
                        remaining = std::min(frames, SampleIndex(signalLength - v.time));
                        in = signal[0] + v.time;
                        finished = remaining != frames; // we might have reached the end
                        v.time += remaining;            // progress time in voice
                    }
                }

                if (l.configuration == Listener::Configuration::HRTF && v.HRTF && mHRTF.rate) {
                    // * HRTF Panning
                    VAE_ASSERT(vi < mVoiceHRTFs.size()) // only the lower voice can use hrtfs
                    VAE_PROFILER_SCOPE_NAMED("Render HRTF")

                    Size closestIndex = HRTFUtil::closest(mHRTF, relativeDirection);

                    if (closestIndex == ~Size(0)) { return true; } // ! no hrtf found?

                    auto& hrtfVoice = mVoiceHRTFs[vi];

                    if (!v.started) { // clear old data
                        hrtfVoice.convolutionIndex = 0;
                        hrtfVoice.convolutionBuffer.set();
                    }

                    HRTFUtil::apply(
                        mHRTF.positions[closestIndex],
                        hrtfVoice, remaining, target, in, distanceAttenuated
                    );

                } else {
                    VAE_PROFILER_SCOPE_NAMED("Render SPCAP")
                    // * Normal SPCAP panning
                    auto& lastPan = manager.getVoicePan(vi);
                    VoicePan currentPan;
                    auto& currentVolumes = currentPan.volumes;
                    auto& lastVolumes = lastPan.volumes;

                    // Per sample progress of the volume interpolation, constant for the block
                    const Sample rampStep = frames > 0 ? Sample(1) / Sample(frames) : Sample(0);

                    /**
                    * @brief Pan and mix templated lambda so we don't have to write this for each config
                    * @param panner Gets a panner instance with pan() and speakers
                    */
                    const auto pan = [&](const auto& panner) {
                        // This is actually constexpr but not according to clangd
                        constexpr Size channels = std::min(Size(StaticConfig::MaxChannels), panner.speakers);
                        panner.pan(
                            relativeDirection, currentVolumes,
                            distanceAttenuated, emitter.spread
                        );

                        if (!v.started) {
                            // first time don't interpolate
                            for (Size c = 0; c < channels; c++) {
                                lastVolumes[c] = currentVolumes[c];
                            }
                        }

                        Sample t = 0;
                        for (SampleIndex s = 0; s < remaining; s++) {
                            const Sample sample = in[s];
                            // lerp between last and current channel volumes
                            // Not correct in terms of power conservation, but easy and efficient
                            for (Size c = 0; c < channels; c++) {
                                target[c][s] += sample * (lastVolumes[c] + t * (currentVolumes[c] - lastVolumes[c]));
                            }
                            t += rampStep;
                        }
                    };

                    switch (l.configuration) {
                        case Listener::Configuration::HRTF:         // falls back to headphone panning
                        case Listener::Configuration::Headphones:   pan(SPCAP::HeadphoneSPCAP); break;
                        case Listener::Configuration::Stereo:       pan(SPCAP::StereroSPCAP);   break;
                        case Listener::Configuration::Suround:      pan(SPCAP::SuroundSPCAP);   break;
                        case Listener::Configuration::Quadrophonic: pan(SPCAP::QuadSPCAP);      break;
                        case Listener::Configuration::Mono:         pan(SPCAP::MonoSPCAP);      break;
                    }

                    lastPan = std::move(currentPan); // start of the volume interpolation for the next block
                }
                v.started = true;
                if (finished) {
                    emitter.autoplaying = false;
                    return false;
                }
                return true;
            });
            return actuallyRendered;
        }

        /**
         * @brief Loads a HRTF and prepares the convolution buffers of all HRTF voices.
         *
         * The arguments are forwarded unchanged to HRTFLoader::load.
         *
         * @param path Forwarded to the loader
         * @param length Forwarded to the loader
         * @param rootPath Forwarded to the loader
         * @param sampleRate Forwarded to the loader
         * @return Result of the loader, Result::Success if the HRTF was loaded
         */
        Result loadHRTF(const char* path, Size length, const char* rootPath, Size sampleRate) {
            Result result = mHRTFLoader.load(path, length, rootPath, sampleRate, mHRTF);
            if (result != Result::Success) { return result; }
            // every voice needs a cleared buffer matching the new impulse response length
            for (auto& i : mVoiceHRTFs) {
                i.convolutionBuffer.resize(mHRTF.irLength);
                i.convolutionBuffer.set();
            }
            return Result::Success;
        }
    };


    // Size of SpatialProcessor in bytes, evaluated at compile time.
    // NOTE(review): not referenced in this header; presumably kept to inspect the object footprint - confirm.
    constexpr int _VAE_SPATIAL_PROCESSOR_SIZE = sizeof(SpatialProcessor);


} } // core::vae


#endif // _VAE_SPATIAL_PROCESSOR

tklb::AudioBufferTpl< Sample, tklb::HeapBuffer< Sample, tklb::DEFAULT_ALIGNMENT, memory::AllocatorScratch< unsigned char > > >

tklb::AudioBufferTpl::resize
bool resize(const Size length, uchar channels)
! Will not keep the contents! Resizes the buffer to the desired length and channel count.
Definition: TAudioBuffer.hpp:276

tklb::HeapBuffer
Basically a bad std::vector without exceptions which can also work with foreign memory.
Definition: THeapBuffer.hpp:49

vae::core::HRTFLoader
Definition: vae_hrtf_loader.hpp:21

vae::core::HRTFLoader::load
Result load(const char *path, Size length, const char *rootPath, const Size sampleRate, HRTF &hrtf)
Definition: vae_hrtf_loader.hpp:36

vae::core::SpatialManager
Definition: vae_spatial_manager.hpp:28

vae::core::SpatialManager::getListeners
Listeners & getListeners()
Definition: vae_spatial_manager.hpp:125

vae::core::SpatialManager::hasEmitter
bool hasEmitter(EmitterHandle e)
Definition: vae_spatial_manager.hpp:100

vae::core::SpatialManager::getEmitter
Emitter & getEmitter(EmitterHandle e)
Definition: vae_spatial_manager.hpp:95

vae::core::SpatialProcessor
Definition: vae_spatial_processor.hpp:20

vae::core::SpatialProcessor::mHRTFLoader
HRTFLoader mHRTFLoader
Struct to decode the hrtf.
Definition: vae_spatial_processor.hpp:22

vae::core::SpatialProcessor::mScratchBuffer
ScratchBuffer mScratchBuffer
Temporary filtered/looped signal TODO this will not work with parallel bank processing.
Definition: vae_spatial_processor.hpp:27

vae::core::SpatialProcessor::mVoiceHRTFs
HeapBuffer< VoiceHRTF > mVoiceHRTFs
Working data for convolution.
Definition: vae_spatial_processor.hpp:23

vae::core::SpatialProcessor::mix
Size mix(VoiceManger &manager, Bank &bank, SpatialManager &spatial, SampleIndex frames, Size sampleRate)
Process a single bank.
Definition: vae_spatial_processor.hpp:45

vae::core::SpatialProcessor::mHRTF
HRTF mHRTF
Currently loaded HRTF, there can only be one.
Definition: vae_spatial_processor.hpp:21

vae::core::SpatialProcessor::loadHRTF
Result loadHRTF(const char *path, Size length, const char *rootPath, Size sampleRate)
Definition: vae_spatial_processor.hpp:282

vae::core::SpatialProcessor::init
Result init(Size hrtfVoices)
Definition: vae_spatial_processor.hpp:29

vae::core::VoiceManger
There is only one voice pool in VAE and it's managed here.
Definition: vae_voice_manager.hpp:34

vae::core::VoiceManger::forEachVoice
void forEachVoice(const Func &&func)
Callback provided to iterate voices, needs to return a bool to indicate when a voice needs to be stop...
Definition: vae_voice_manager.hpp:81

tklb::min
T min(const T &v1, const T &v2)
Definition: TMath.hpp:16

vae::StaticConfig::MinVolume
constexpr Sample MinVolume
Minimum volume before sounds will skip rendering.
Definition: vae.hpp:307

vae::StaticConfig::MaxBlock
constexpr Size MaxBlock
Maximum block size.
Definition: vae.hpp:276

vae::StaticConfig::MaxChannels
constexpr unsigned char MaxChannels
Maximum channel count used to pre allocate buffers.
Definition: vae.hpp:268

vae::core::SampleIndex
AudioBuffer::Size SampleIndex
Definition: vae_types.hpp:87

vae::core::Real
float Real
Definition: vae_types.hpp:48

vae::core::Vec3
glm::vec3 Vec3
Definition: vae_types.hpp:47

vae::core::_VAE_SPATIAL_PROCESSOR_SIZE
constexpr int _VAE_SPATIAL_PROCESSOR_SIZE
Definition: vae_spatial_processor.hpp:293

vae
Contains type definitions and basic structures used by the public API and internally.
Definition: vae.hpp:31

vae::Size
unsigned int Size
How the elements are addressed in the heapbuffer.
Definition: vae.hpp:33

vae::Sample
float Sample
Default sample types used wherever possible, changing this means the engine needs to be recompiled,...
Definition: vae.hpp:32

vae::Result
Result
Return Types for most engine functions.
Definition: vae.hpp:73

vae::Result::Success
@ Success
:)

vae::core::Bank
Bank object containing Sources, Mixers and Events Can be loaded and unloaded at runtime.
Definition: vae_bank.hpp:14

vae::core::Bank::mixers
HeapBuffer< Mixer > mixers
Audio Mixers which can have effects ! is presorted !
Definition: vae_bank.hpp:16

vae::core::Bank::id
BankHandle id
Definition: vae_bank.hpp:18

vae::core::Bank::sources
HeapBuffer< Source > sources
Audio sources defined.
Definition: vae_bank.hpp:15

vae::core::HRTF
Definition: vae_hrtf.hpp:8

vae::core::HRTF::irLength
Size irLength
Definition: vae_hrtf.hpp:16

vae::core::HRTF::rate
Size rate
Definition: vae_hrtf.hpp:15

vae::core::HRTF::positions
HeapBuffer< Position > positions
Definition: vae_hrtf.hpp:13

vae::core::HRTFUtil::apply
static void apply(HRTF::Position &hrtf, VoiceHRTF &hrtfVoice, SampleIndex frames, ScratchBuffer &target, const Sample *in, Sample distanceAttenuated)
Applies simple time domain convolution.
Definition: vae_hrtf_util.hpp:48

vae::core::Listener::Configuration::Suround
@ Suround
Definition: vae_listener.hpp:18

vae::core::Listener::Configuration::Quadrophonic
@ Quadrophonic
Definition: vae_listener.hpp:17

vae::core::Listener::Configuration::Mono
@ Mono
Definition: vae_listener.hpp:13

vae::core::Listener::Configuration::HRTF
@ HRTF
Definition: vae_listener.hpp:16

vae::core::Listener::Configuration::Headphones
@ Headphones
Definition: vae_listener.hpp:14

vae::core::Listener::Configuration::Stereo
@ Stereo
Definition: vae_listener.hpp:15

vae::core::SPCAP::StereroSPCAP
static const SPCAPConfig< 2 > StereroSPCAP
Definition: vae_spcap.hpp:84

vae::core::SPCAP::MonoSPCAP
static const SPCAPConfig< 1 > MonoSPCAP
TODO there's probably a smart way to make this all constexpr.
Definition: vae_spcap.hpp:82

vae::core::SPCAP::QuadSPCAP
static const SPCAPConfig< 4 > QuadSPCAP
Definition: vae_spcap.hpp:85

vae::core::SPCAP::SuroundSPCAP
static const SPCAPConfig< 5 > SuroundSPCAP
Definition: vae_spcap.hpp:86

vae::core::SPCAP::HeadphoneSPCAP
static const SPCAPConfig< 2 > HeadphoneSPCAP
Definition: vae_spcap.hpp:83

vae::core::Voice
Barebones voice.
Definition: vae_voice.hpp:17

vae::core::Voice::source
SourceHandle source
If invalid, means voice is not playing.
Definition: vae_voice.hpp:28

vae::core::Voice::spatialized
bool spatialized
If the voice has spatialization data.
Definition: vae_voice.hpp:18

vae::core::Voice::listener
ListenerHandle listener
If it's spatialized it's rendered for this listener.
Definition: vae_voice.hpp:32

vae::core::Voice::gain
Sample gain
Volume of the voice.
Definition: vae_voice.hpp:33

vae::core::Voice::audible
bool audible
Whether the voice was heard by any listener.
Definition: vae_voice.hpp:21

vae::core::Voice::bank
BankHandle bank
Which bank it belongs to.
Definition: vae_voice.hpp:27

vae::core::Voice::filtered
bool filtered
This will enable high/lowpass filters and variable speed playback. Gets turned on when signal does no...
Definition: vae_voice.hpp:24

vae::core::Voice::mixer
MixerHandle mixer
Where the voice should mix to.
Definition: vae_voice.hpp:31

vae::core::Voice::emitter
EmitterHandle emitter
Emitter used to control voice properties.
Definition: vae_voice.hpp:30

vae::core::Voice::loop
bool loop
Voice will loop until killed.
Definition: vae_voice.hpp:23

vae::core::Voice::time
SampleIndex time
Current time in samples.
Definition: vae_voice.hpp:34

VAE_PROFILER_SCOPE_NAMED
#define VAE_PROFILER_SCOPE_NAMED(name)
Profiles a scope and names it.
Definition: vae_profiler.hpp:73

VAE_ASSERT
#define VAE_ASSERT(condition)
Definition: vae_util.hpp:11