Spatial_Audio_Framework/saf__hades__internal_8h_source.html

/*

 * This file is part of the saf_hades module.

 * Copyright (c) 2021 - Leo McCormack & Janani Fernandez

 *

 * The saf_hades module is free software; you can redistribute it and/or

 * modify it under the terms of the GNU General Public License as published by

 * the Free Software Foundation; either version 2 of the License, or (at your

 * option) any later version.

 *

 * The saf_hades module is distributed in the hope that it will be useful, but

 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY

 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for

 * more details.

 *

 * See <http://www.gnu.org/licenses/> for a copy of the GNU General Public

 * License.

 */


#ifndef __SAF_HADES_INTERNAL_H_INCLUDED__

#define __SAF_HADES_INTERNAL_H_INCLUDED__


#include "saf_hades_analysis.h"

#include "saf_hades_synthesis.h"

#include "saf.h"

#include "saf_externals.h"


#ifdef __cplusplus

extern "C" {

#endif /* __cplusplus */


#ifdef  SAF_ENABLE_HADES_MODULE


/** Upper limit used for the processing blocksize
 *  (NOTE(review): meaning and unit inferred from the macro name only -
 *  presumably samples; confirm against the code that uses it) */
#define HADES_MAX_BLOCKSIZE (4096)


/** Helper struct for averaging covariance matrices (block-wise) */
typedef struct _CxMic {
    /** Fixed-size matrix storage with room for HADES_MAX_NMICS x
     *  HADES_MAX_NMICS complex entries */
    float_complex Cx[HADES_MAX_NMICS * HADES_MAX_NMICS];
} CxMic;


/* ========================================================================== */

/*                           Main Internal Structs                            */

/* ========================================================================== */


/** Main structure for hades analysis */
typedef struct _hades_analysis_data {
    /* User parameters (defined at initialisation stage) */
    float fs;                             /**< Host samplerate, Hz */
    HADES_FILTERBANKS fbOpt;              /**< see HADES_FILTERBANKS */
    int hopsize;                          /**< Filterbank hop size (blocksize must be divisible by this) */
    int blocksize;                        /**< Number of samples to process at a time (note that 1 doa and diffuseness estimate is made per block) */
    int hybridmode;                       /**< Optionally, the lowest TF bands may be subdivided to improve low-freq resolution */
    float* h_array;                       /**< Array impulse responses; FLAT: nGrid x nMics x h_len */
    float* grid_dirs_deg;                 /**< Array grid dirs in degrees; FLAT: nGrid x 2 */
    int nGrid;                            /**< Number of grid/scanning directions */
    int nMics;                            /**< Number of microphones */
    int h_len;                            /**< Length of impulse responses, in samples */
    HADES_DIFFUSENESS_ESTIMATORS diffOpt; /**< see HADES_DIFFUSENESS_ESTIMATORS */
    HADES_DOA_ESTIMATORS doaOpt;          /**< see HADES_DOA_ESTIMATORS */

    /* Optional user parameters (that can also be manipulated at run-time) */
    float covAvgCoeff;                    /**< Temporal averaging coefficient [0 1] */

    /* Time-frequency transform and array data */
    void* hFB_enc;                        /**< Time-frequency transform handle */
    int nBands;                           /**< Number of frequency bands */
    int timeSlots;                        /**< Number of time slots */
    int filterbankDelay;                  /**< Filterbank delay, in time-domain samples */
    float* freqVector;                    /**< Centre frequencies; nBands x 1 */
    float_complex* DCM_array;             /**< Diffuse covariance matrix (computed over all grid directions and weighted); FLAT: nBands x nMics x nMics */
    float_complex* H_array;               /**< Array IRs in the frequency domain; FLAT: nBands x nMics x nDirs */
    float_complex* H_array_w;             /**< Array IRs in the frequency domain, spatially weighted; FLAT: nBands x nMics x nDirs */

    /* DoA and diffuseness estimator data */
    void* hEig;                           /**< Handle for the eigen solver */
    float_complex** T;                    /**< For covariance whitening; nBands x (nMics x nMics) */
    void* hDoA;                           /**< DoA estimator handle */
    float* grid_dirs_xyz;                 /**< Scanning grid coordinates (unit vectors and only used by grid-based estimators); FLAT: nGrid x 3 */
    float_complex* W;                     /**< Diffuse integration weighting matrix; FLAT: nGrid x nGrid */

    /* Run-time variables */
    float** inputBlock;                   /**< Input frame; nMics x blocksize */
    CxMic* Cx;                            /**< Current (time-averaged) covariance matrix per band; nBands x 1 */
    float_complex* V;                     /**< Eigen vectors; FLAT: nMics x nMics */
    float_complex* Vn;                    /**< Noise subspace; FLAT: nMics x (nMics-1) */
    float* lambda;                        /**< Eigenvalues; nMics x 1 */
} hades_analysis_data;


/** Main structure for hades synthesis */
typedef struct _hades_synthesis_data {
    /* User parameters */
    HADES_BEAMFORMER_TYPE beamOption;       /**< see HADES_BEAMFORMER_TYPE */
    int enableCM;                           /**< Flag: whether the spatial covariance matching is enabled (1) or disabled (0) */
    hades_binaural_config* binConfig;       /**< Internal copy of user configuration */
    int refIndices[2];                      /**< Indices into [0 nMics-1], defining the reference sensors */
    HADES_HRTF_INTERP_OPTIONS interpOption; /**< HRIR interpolation option, see HADES_HRTF_INTERP_OPTIONS */

    /* Optional user parameters (that can also be manipulated at run-time) */
    float* eq;                              /**< Gain factor per band; nBands x 1 */
    float* streamBalance;                   /**< Stream balance per band (0:fully diffuse, 1:balanced, 2:fully direct); nBands x 1 */
    float synAvgCoeff;                      /**< Mixing matrix averaging coefficient [0..1] */

    /* Things relevant to the synthesiser, which are copied from the
     * hades_analysis_create() to keep everything aligned */
    HADES_FILTERBANKS fbOpt;                /**< Filterbank option, see HADES_FILTERBANKS */
    int nBands;                             /**< Number of bands in the time-frequency transform domain */
    int hopsize;                            /**< Hopsize in samples */
    int blocksize;                          /**< Blocksize in samples */
    int nGrid;                              /**< Number of grid/scanning directions */
    int nMics;                              /**< Number of microphones */
    float_complex* H_array;                 /**< Array IRs in the frequency domain; FLAT: nBands x nMics x nGrid */
    float* grid_dirs_deg;                   /**< Array grid dirs in degrees; FLAT: nGrid x 2 */
    float** grid_dirs_xyz;                  /**< Grid dirs as Cartesian coordinates of unit length; nGrid x 3 */
    int timeSlots;                          /**< Number of time frames in the time-frequency transform domain */
    float* freqVector;                      /**< Frequency vector (band centre frequencies); nBands x 1 */
    float_complex* DCM_array;               /**< Diffuse coherence matrix for the array; FLAT: nBands x nMics x nMics */
    float_complex* W;                       /**< Diffuse integration weighting matrix; FLAT: nGrid x nGrid */

    /* Time-frequency transform */
    void* hFB_dec;                          /**< Filterbank handle */

    /* HRTF and diffuse rendering variables */
    float_complex* H_bin;                   /**< To spatialise the source beamformers; FLAT: nBands x NUM_EARS x nGrid */
    float_complex* DCM_bin_norm;            /**< Diffuse coherence matrix for the HRTF set, normalised with 1/trace(DCM_bin) (NOTE(review): dimensions to be confirmed against the allocation) */
    float* diffEQ;                          /**< EQ curve to bring the overall diffuse-field magnitude response of the array to that of the HRTFs */

    /* Run-time variables */
    void* hPinv;                            /**< Handle for computing the Moore-Penrose pseudo inverse */
    void* hLinSolve;                        /**< Handle for solving linear equations (Ax=b) */
    void* hCDF;                             /**< Handle for solving the covariance matching problem */
    float_complex* As;                      /**< Array steering vector for DoA; FLAT: nMics x 1 */
    float_complex* As_l;                    /**< Array steering vector relative to left reference sensor; FLAT: nMics x 1 */
    float_complex* As_r;                    /**< Array steering vector relative to right reference sensor; FLAT: nMics x 1 */
    float_complex* Q_diff;                  /**< Mixing matrix for the diffuse stream; FLAT: NUM_EARS x nMics */
    float_complex* Q_dir;                   /**< Mixing matrix for the direct stream; FLAT: NUM_EARS x nMics */
    float_complex* Q;                       /**< Mixing matrix for the direct and diffuse streams combined (based on the diffuseness value) (NOTE(review): presumably FLAT: NUM_EARS x nMics like Q_dir/Q_diff - confirm) */
    float_complex* Cy;                      /**< Target binaural spatial covariance matrix; FLAT: NUM_EARS x NUM_EARS */
    float_complex* new_M;                   /**< New mixing matrix (not yet temporally averaged); FLAT: NUM_EARS x nMics */
    float_complex** M;                      /**< Mixing matrix per band; nBands x FLAT: (NUM_EARS x nMics) */

    /* Run-time audio buffers */
    float_complex*** outTF;                 /**< Output frame in the TF-domain; nBands x NUM_EARS x timeSlots */
    float** outTD;                          /**< Output time-domain buffer; NUM_EARS x blocksize */
} hades_synthesis_data;


/** Parameter container to store the data from an analyser for one blocksize
 *  of audio */
typedef struct _hades_param_container_data
{
    int nBands;          /**< Number of bands */

    /* Estimated Parameters */
    float* diffuseness;  /**< Diffuseness value per band; nBands x 1 */
    int* doa_idx;        /**< Beamforming direction index per band; nBands x 1 */
    int* gains_idx;      /**< Reproduction direction index per band; nBands x 1 */

    /* Optional parameters */
    float* gains_dir;    /**< Extra direct reproduction gain per band (default=1.0f); nBands x 1 */
    float* gains_diff;   /**< Extra diffuse reproduction gain per band (default=1.0f); nBands x 1 */
}
hades_param_container_data;


/** Main structure for hades radial (360degree) gain and direct-to-diffuse
 *  ratio editor */
typedef struct _hades_radial_editor_data
{
    int nBands;             /**< Number of bands */
    int nGrid;              /**< Number of grid/scanning directions */
    float* pGrid_dirs_deg;  /**< Pointer to grid dirs in degrees; FLAT: nGrid x 2 */
    float* pGrid_dirs_xyz;  /**< Pointer to grid dirs as Cartesian coordinates of unit length; FLAT: nGrid x 3 */
}
hades_radial_editor_data;


/** Signal container to store one block of TF-domain audio data */
typedef struct _hades_signal_container_data
{
    int nMics;               /**< Number of microphones */
    int nBands;              /**< Number of bands in the time-frequency transform */
    int timeSlots;           /**< Number of time frames in time-frequency transform */

    /* Covariance matrices and signal statistics computed during the analysis */
    CxMic* Cx;               /**< NON-time-averaged covariance matrix per band; nBands x .Cx(nMics x nMics) */

    /* TF frame to carry over to a decoder */
    float_complex*** inTF;   /**< Input frame in TF-domain; nBands x nMics x timeSlots */
}
hades_signal_container_data;


/* ========================================================================== */

/*                             Internal Functions                             */

/* ========================================================================== */


/**
 * Binaural filter interpolator
 *
 * @param[in]  hAna            hades analysis handle
 * @param[in]  interpOption    Interpolation option, see
 *                             HADES_HRTF_INTERP_OPTIONS
 * @param[in]  binConfig       Binaural configuration
 * @param[in]  target_dirs_deg Target directions, in degrees (NOTE(review):
 *                             presumably FLAT: nTargetDirs x 2 - confirm)
 * @param[in]  nTargetDirs     Number of target directions
 * @param[out] hrtf_interp     Interpolated filters (NOTE(review): dimensions
 *                             are not visible from this header - confirm in
 *                             saf_hades_internal.c)
 */
void hades_getInterpolatedHRTFs(
    /* Input Arguments */
    hades_analysis_handle const hAna,
    HADES_HRTF_INTERP_OPTIONS interpOption,
    hades_binaural_config* binConfig,
    float* target_dirs_deg,
    int nTargetDirs,
    /* Output Arguments */
    float_complex* hrtf_interp);


/**
 * Creates an instance of the space-domain MUSIC implementation
 *
 * @param[in,out] phMUSIC       Address of the handle for the instance
 *                              (NOTE(review): presumably written on return
 *                              and later released with
 *                              hades_sdMUSIC_destroy() - confirm)
 * @param[in]     nMics         Number of microphones
 * @param[in]     grid_dirs_deg Grid directions, in degrees (NOTE(review):
 *                              presumably FLAT: nDirs x 2 - confirm)
 * @param[in]     nDirs         Number of grid directions
 */
void hades_sdMUSIC_create(
    void ** const phMUSIC,
    int nMics,
    float* grid_dirs_deg,
    int nDirs);


/**
 * Destroys an instance of the MUSIC implementation created with
 * hades_sdMUSIC_create()
 *
 * @param[in,out] phMUSIC Address of the handle for the instance to destroy
 */
void hades_sdMUSIC_destroy(
    void ** const phMUSIC);


/**
 * Computes a pseudo-spectrum based on the MUSIC algorithm, optionally
 * returning grid indices (see peak_inds)
 *
 * @param[in]  hMUSIC    Handle for the MUSIC instance
 * @param[in]  A_grid    Steering vectors for the scanning grid
 *                       (NOTE(review): layout not visible from this header -
 *                       confirm in saf_hades_internal.c)
 * @param[in]  Vn        Noise subspace (NOTE(review): presumably
 *                       FLAT: nMics x (nMics-nSrcs) - confirm)
 * @param[in]  nSrcs     Number of sources
 * @param[out] P_music   Pseudo-spectrum (NOTE(review): presumably one value
 *                       per grid direction - confirm)
 * @param[out] peak_inds Grid indices (NOTE(review): presumably the
 *                       pseudo-spectrum peaks, one per source, and
 *                       presumably optional/NULL-able - confirm)
 */
void hades_sdMUSIC_compute(
    /* Input arguments */
    void* const hMUSIC,
    float_complex* A_grid,
    float_complex* Vn,
    int nSrcs,
    /* Output arguments */
    float* P_music,
    int* peak_inds);


/**
 * Returns an estimate of the diffuseness (the reference it is based on is
 * cited alongside the implementation in saf_hades_internal.c)
 *
 * @param[in] lambda Eigenvalues (NOTE(review): presumably N x 1 - confirm)
 * @param[in] N      Number of values (NOTE(review): presumably the length of
 *                   lambda - confirm)
 * @returns the diffuseness estimate
 */
float hades_comedie(
    float* lambda,
    int N);


#endif /* SAF_ENABLE_HADES_MODULE */


#ifdef __cplusplus

} /* extern "C" */

#endif /* __cplusplus */


#endif /* __SAF_HADES_INTERNAL_H_INCLUDED__ */

saf.h
Main include header for the Spatial_Audio_Framework (SAF)

saf_externals.h
Include header for SAF externals.

saf_hades_analysis.h
Header for the HADES analysis (SAF_HADES_MODULE)

HADES_MAX_NMICS
#define HADES_MAX_NMICS
Maximum number of microphones.
Definition saf_hades_analysis.h:48

hades_analysis_handle
struct _hades_analysis_data * hades_analysis_handle
Handle for the hades analysis data.
Definition saf_hades_analysis.h:51

HADES_FILTERBANKS
HADES_FILTERBANKS
Filterbank options.
Definition saf_hades_analysis.h:80

HADES_DOA_ESTIMATORS
HADES_DOA_ESTIMATORS
Options for DoA estimation for hades_analysis.
Definition saf_hades_analysis.h:75

HADES_DIFFUSENESS_ESTIMATORS
HADES_DIFFUSENESS_ESTIMATORS
Options for diffuseness estimation for hades_analysis.
Definition saf_hades_analysis.h:70

hades_sdMUSIC_destroy
void hades_sdMUSIC_destroy(void **const phMUSIC)
Destroys an instance of the space-domain MUSIC implementation, which may be used for com...
Definition saf_hades_internal.c:157

hades_sdMUSIC_create
void hades_sdMUSIC_create(void **const phMUSIC, int nMics, float *grid_dirs_deg, int nDirs)
Creates an instance of the space-domain MUSIC implementation.
Definition saf_hades_internal.c:130

hades_getInterpolatedHRTFs
void hades_getInterpolatedHRTFs(hades_analysis_handle const hAna, HADES_HRTF_INTERP_OPTIONS interpOption, hades_binaural_config *binConfig, float *target_dirs_deg, int nTargetDirs, float_complex *hrtf_interp)
Binaural filter interpolator.
Definition saf_hades_internal.c:43

hades_sdMUSIC_compute
void hades_sdMUSIC_compute(void *const hMUSIC, float_complex *A_grid, float_complex *Vn, int nSrcs, float *P_music, int *peak_inds)
Computes a pseudo-spectrum based on the MUSIC algorithm optionally returning the grid indices corresp...
Definition saf_hades_internal.c:178

hades_comedie
float hades_comedie(float *lambda, int N)
Returns an estimate of the diffuseness, based on [1].
Definition saf_hades_internal.c:243

saf_hades_synthesis.h
Header for the HADES synthesis (SAF_HADES_MODULE)

HADES_BEAMFORMER_TYPE
HADES_BEAMFORMER_TYPE
Beamforming options for hades_synthesis.
Definition saf_hades_synthesis.h:71

HADES_HRTF_INTERP_OPTIONS
HADES_HRTF_INTERP_OPTIONS
HRTF interpolation options for hades_synthesis.
Definition saf_hades_synthesis.h:79

CxMic
Helper struct for averaging covariance matrices (block-wise)
Definition saf_hades_internal.h:56

hades_analysis_data
Main structure for hades analysis.
Definition saf_hades_internal.h:66

hades_analysis_data::nMics
int nMics
Number of microphones.
Definition saf_hades_internal.h:76

hades_analysis_data::covAvgCoeff
float covAvgCoeff
Temporal averaging coefficient [0 1].
Definition saf_hades_internal.h:82

hades_analysis_data::T
float_complex ** T
for covariance whitening; nBands x (nMics x nMics)
Definition saf_hades_internal.h:96

hades_analysis_data::blocksize
int blocksize
Number of samples to process at a time (note that 1 doa and diffuseness estimate is made per block)
Definition saf_hades_internal.h:71

hades_analysis_data::hybridmode
int hybridmode
Optionally, the lowest TF bands may be subdivided to improve low-freq resolution.
Definition saf_hades_internal.h:72

hades_analysis_data::hEig
void * hEig
handle for the eigen solver
Definition saf_hades_internal.h:95

hades_analysis_data::DCM_array
float_complex * DCM_array
Diffuse covariance matrix (computed over all grid directions and weighted); FLAT: nBands x nMics x nM...
Definition saf_hades_internal.h:90

hades_analysis_data::grid_dirs_xyz
float * grid_dirs_xyz
Scanning grid coordinates (unit vectors and only used by grid-based estimators); FLAT: nGrid x 3.
Definition saf_hades_internal.h:98

hades_analysis_data::h_array
float * h_array
Array impulse responses; FLAT: nGrid x nMics x h_len.
Definition saf_hades_internal.h:73

hades_analysis_data::freqVector
float * freqVector
Centre frequencies; nBands x 1.
Definition saf_hades_internal.h:89

hades_analysis_data::doaOpt
HADES_DOA_ESTIMATORS doaOpt
see HADES_DOA_ESTIMATORS
Definition saf_hades_internal.h:79

hades_analysis_data::grid_dirs_deg
float * grid_dirs_deg
Array grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:74

hades_analysis_data::inputBlock
float ** inputBlock
Input frame; nMics x blocksize.
Definition saf_hades_internal.h:102

hades_analysis_data::hopsize
int hopsize
Filterbank hop size (blocksize must be divisible by this).
Definition saf_hades_internal.h:70

hades_analysis_data::V
float_complex * V
Eigen vectors; FLAT: nMics x nMics.
Definition saf_hades_internal.h:104

hades_analysis_data::fbOpt
HADES_FILTERBANKS fbOpt
see HADES_FILTERBANKS
Definition saf_hades_internal.h:69

hades_analysis_data::H_array_w
float_complex * H_array_w
Array IRs in the frequency domain, spatially weighted; FLAT: nBands x nMics x nDirs.
Definition saf_hades_internal.h:92

hades_analysis_data::hFB_enc
void * hFB_enc
Time-frequency transform handle.
Definition saf_hades_internal.h:85

hades_analysis_data::W
float_complex * W
Diffuse integration weighting matrix; FLAT: nGrid x nGrid.
Definition saf_hades_internal.h:99

hades_analysis_data::h_len
int h_len
Length of impulse responses, in samples.
Definition saf_hades_internal.h:77

hades_analysis_data::lambda
float * lambda
Eigenvalues; nMics x 1.
Definition saf_hades_internal.h:106

hades_analysis_data::Cx
CxMic * Cx
Current (time-averaged) covariance matrix per band; nBands x 1.
Definition saf_hades_internal.h:103

hades_analysis_data::H_array
float_complex * H_array
Array IRs in the frequency domain; FLAT: nBands x nMics x nDirs.
Definition saf_hades_internal.h:91

hades_analysis_data::fs
float fs
Host samplerate, Hz.
Definition saf_hades_internal.h:68

hades_analysis_data::filterbankDelay
int filterbankDelay
Filterbank delay, in time-domain samples.
Definition saf_hades_internal.h:88

hades_analysis_data::nBands
int nBands
Number of frequency bands.
Definition saf_hades_internal.h:86

hades_analysis_data::hDoA
void * hDoA
DoA estimator handle.
Definition saf_hades_internal.h:97

hades_analysis_data::timeSlots
int timeSlots
Number of time slots.
Definition saf_hades_internal.h:87

hades_analysis_data::Vn
float_complex * Vn
Noise subspace; FLAT: nMics x (nMics-1)
Definition saf_hades_internal.h:105

hades_analysis_data::diffOpt
HADES_DIFFUSENESS_ESTIMATORS diffOpt
see HADES_DIFFUSENESS_ESTIMATORS
Definition saf_hades_internal.h:78

hades_analysis_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:75

hades_binaural_config
Binaural configuration struct.
Definition saf_hades_synthesis.h:60

hades_param_container_data
Parameter container to store the data from an analyser for one blocksize of audio.
Definition saf_hades_internal.h:169

hades_param_container_data::gains_idx
int * gains_idx
Reproduction direction index per band; nBands x 1.
Definition saf_hades_internal.h:175

hades_param_container_data::doa_idx
int * doa_idx
Beamforming direction index per band; nBands x 1.
Definition saf_hades_internal.h:174

hades_param_container_data::diffuseness
float * diffuseness
Diffuseness value per band; nBands x 1.
Definition saf_hades_internal.h:173

hades_param_container_data::gains_diff
float * gains_diff
Extra diffuse reproduction gain per band (default=1.0f); nBands x 1.
Definition saf_hades_internal.h:179

hades_param_container_data::nBands
int nBands
Number of bands.
Definition saf_hades_internal.h:170

hades_param_container_data::gains_dir
float * gains_dir
Extra direct reproduction gain per band (default=1.0f); nBands x 1.
Definition saf_hades_internal.h:178

hades_radial_editor_data
Main structure for hades radial (360degree) gain and direct-to-diffuse ratio editor.
Definition saf_hades_internal.h:184

hades_radial_editor_data::pGrid_dirs_deg
float * pGrid_dirs_deg
Pointer to grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:187

hades_radial_editor_data::pGrid_dirs_xyz
float * pGrid_dirs_xyz
Pointer to grid dirs as Cartesian coordinates of unit length; FLAT: nGrid x 3.
Definition saf_hades_internal.h:188

hades_radial_editor_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:186

hades_radial_editor_data::nBands
int nBands
Number of bands.
Definition saf_hades_internal.h:185

hades_signal_container_data
Signal container to store one block of TF-domain audio data.
Definition saf_hades_internal.h:193

hades_signal_container_data::nBands
int nBands
Number of bands in the time-frequency transform.
Definition saf_hades_internal.h:195

hades_signal_container_data::nMics
int nMics
Number of microphones.
Definition saf_hades_internal.h:194

hades_signal_container_data::timeSlots
int timeSlots
Number of time frames in time-frequency transform.
Definition saf_hades_internal.h:196

hades_signal_container_data::Cx
CxMic * Cx
NON-time-averaged covariance matrix per band; nBands x .Cx(nMics x nMics)
Definition saf_hades_internal.h:199

hades_signal_container_data::inTF
float_complex *** inTF
Input frame in TF-domain; nBands x nMics x timeSlots.
Definition saf_hades_internal.h:202

hades_synthesis_data
Main structure for hades synthesis.
Definition saf_hades_internal.h:112

hades_synthesis_data::outTD
float ** outTD
output time-domain buffer; NUM_EARS x blocksize
Definition saf_hades_internal.h:164

hades_synthesis_data::hLinSolve
void * hLinSolve
Handle for solving linear equations (Ax=b)
Definition saf_hades_internal.h:150

hades_synthesis_data::blocksize
int blocksize
blocksize in samples
Definition saf_hades_internal.h:129

hades_synthesis_data::hCDF
void * hCDF
Handle for solving the covariance matching problem.
Definition saf_hades_internal.h:151

hades_synthesis_data::M
float_complex ** M
Mixing matrix per band; nBands x FLAT: (NUM_EARS x nMics)
Definition saf_hades_internal.h:160

hades_synthesis_data::synAvgCoeff
float synAvgCoeff
Mixing matrix averaging coefficient [0..1].
Definition saf_hades_internal.h:123

hades_synthesis_data::fbOpt
HADES_FILTERBANKS fbOpt
Filterbank option, see HADES_FILTERBANKS.
Definition saf_hades_internal.h:126

hades_synthesis_data::new_M
float_complex * new_M
New mixing matrix (not yet temporally averaged); FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:159

hades_synthesis_data::nBands
int nBands
Number of bands in the time-frequency transform domain.
Definition saf_hades_internal.h:127

hades_synthesis_data::H_array
float_complex * H_array
Array IRs in the frequency domain; FLAT: nBands x nMics x nGrid.
Definition saf_hades_internal.h:132

hades_synthesis_data::As
float_complex * As
Array steering vector for DoA; FLAT: nMics x 1.
Definition saf_hades_internal.h:152

hades_synthesis_data::eq
float * eq
Gain factor per band; nBands x 1.
Definition saf_hades_internal.h:121

hades_synthesis_data::timeSlots
int timeSlots
Number of time frames in the time-frequency transform domain.
Definition saf_hades_internal.h:135

hades_synthesis_data::H_bin
float_complex * H_bin
To spatialise the source beamformers; FLAT: nBands x NUM_EARS x nGrid.
Definition saf_hades_internal.h:144

hades_synthesis_data::beamOption
HADES_BEAMFORMER_TYPE beamOption
see HADES_BEAMFORMER_TYPE
Definition saf_hades_internal.h:114

hades_synthesis_data::enableCM
int enableCM
Flag: whether the spatial covariance matching is enabled (1) or disabled (0)
Definition saf_hades_internal.h:115

hades_synthesis_data::binConfig
hades_binaural_config * binConfig
Internal copy of user configuration.
Definition saf_hades_internal.h:116

hades_synthesis_data::freqVector
float * freqVector
Frequency vector (band centre frequencies); nBands x 1.
Definition saf_hades_internal.h:136

hades_synthesis_data::grid_dirs_deg
float * grid_dirs_deg
Array grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:133

hades_synthesis_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:130

hades_synthesis_data::Q
float_complex * Q
Mixing matrix for the direct and diffuse streams combined (based on the diffuseness value); FLAT: NUM...
Definition saf_hades_internal.h:157

hades_synthesis_data::As_r
float_complex * As_r
Array steering vector relative to right reference sensor; FLAT: nMics x 1.
Definition saf_hades_internal.h:154

hades_synthesis_data::diffEQ
float * diffEQ
EQ curve to bring the overall diffuse-field magnitude response of the array to that of the HRTFs inst...
Definition saf_hades_internal.h:146

hades_synthesis_data::hPinv
void * hPinv
Handle for computing the Moore-Penrose pseudo inverse.
Definition saf_hades_internal.h:149

hades_synthesis_data::DCM_array
float_complex * DCM_array
Diffuse coherence matrix for the array; FLAT: nBands x nMics x nMics.
Definition saf_hades_internal.h:137

hades_synthesis_data::hopsize
int hopsize
hopsize in samples
Definition saf_hades_internal.h:128

hades_synthesis_data::Cy
float_complex * Cy
Target binaural spatial covariance matrix; FLAT: NUM_EARS x NUM_EARS.
Definition saf_hades_internal.h:158

hades_synthesis_data::outTF
float_complex *** outTF
nBands x NUM_EARS x timeSlots
Definition saf_hades_internal.h:163

hades_synthesis_data::grid_dirs_xyz
float ** grid_dirs_xyz
Grid dirs as Cartesian coordinates of unit length; nGrid x 3.
Definition saf_hades_internal.h:134

hades_synthesis_data::Q_dir
float_complex * Q_dir
Mixing matrix for the direct stream; FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:156

hades_synthesis_data::DCM_bin_norm
float_complex * DCM_bin_norm
Diffuse coherence matrix for the HRTF set, normalised with 1/trace(DCM_bin); FLAT: nBands x nMics x n...
Definition saf_hades_internal.h:145

hades_synthesis_data::W
float_complex * W
Diffuse integration weighting matrix; FLAT: nGrid x nGrid.
Definition saf_hades_internal.h:138

hades_synthesis_data::Q_diff
float_complex * Q_diff
Mixing matrix for the diffuse stream; FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:155

hades_synthesis_data::interpOption
HADES_HRTF_INTERP_OPTIONS interpOption
HRIR interpolation option, see HADES_HRTF_INTERP_OPTIONS.
Definition saf_hades_internal.h:118

hades_synthesis_data::As_l
float_complex * As_l
Array steering vector relative to left reference sensor; FLAT: nMics x 1.
Definition saf_hades_internal.h:153

hades_synthesis_data::refIndices
int refIndices[2]
Indices into [0 nMics-1], defining the reference sensors.
Definition saf_hades_internal.h:117

hades_synthesis_data::hFB_dec
void * hFB_dec
Filterbank handle.
Definition saf_hades_internal.h:141

hades_synthesis_data::nMics
int nMics
Number of microphones.
Definition saf_hades_internal.h:131

hades_synthesis_data::streamBalance
float * streamBalance
Stream balance per band (0:fully diffuse, 1:balanced, 2:fully direct); nBands x 1.
Definition saf_hades_internal.h:122