Spatial_Audio_Framework/saf__hades__synthesis_8c_source.html

/*

 * This file is part of the saf_hades module.

 * Copyright (c) 2021 - Leo McCormack & Janani Fernandez

 *

 * The saf_hades module is free software; you can redistribute it and/or

 * modify it under the terms of the GNU General Public License as published by

 * the Free Software Foundation; either version 2 of the License, or (at your

 * option) any later version.

 *

 * The saf_hades module is distributed in the hope that it will be useful, but

 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY

 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for

 * more details.

 *

 * See <http://www.gnu.org/licenses/> for a copy of the GNU General Public

 * License.

 */


#include "saf_hades_synthesis.h"

#include "saf_hades_internal.h"


#ifdef  SAF_ENABLE_HADES_MODULE


/* ========================================================================== */

/*                            HADES Radial Editor                             */

/* ========================================================================== */


/**
 * Creates a hades radial editor object and returns its handle via phREd.
 *
 * The editor copies the band and grid counts from the analyser and keeps
 * pointers to the analyser's grid direction tables (they are not duplicated).
 *
 * @param[out] phREd (&) address of the radial editor handle to populate
 * @param[in]  hAna  hades analysis handle to take the configuration from
 */
void hades_radial_editor_create
(
    hades_radial_editor_handle* const phREd,
    hades_analysis_handle const hAna
)
{
    hades_analysis_data* const ana = (hades_analysis_data*)(hAna);
    hades_radial_editor_data* const editor =
        (hades_radial_editor_data*)malloc1d(sizeof(hades_radial_editor_data));

    /* Dimensions are copied by value */
    editor->nBands = ana->nBands;
    editor->nGrid  = ana->nGrid;

    /* Grid tables are referenced, not copied: they remain the analyser's */
    editor->pGrid_dirs_deg = ana->grid_dirs_deg;
    editor->pGrid_dirs_xyz = ana->grid_dirs_xyz;

    *phREd = (hades_radial_editor_handle)editor;
}


/**
 * Destroys a hades radial editor object and sets the caller's handle to NULL.
 *
 * Only the editor struct itself is freed; the grid tables it points to are
 * not released here. Passing a handle that is already NULL is a no-op.
 *
 * @param[in,out] phREd (&) address of the radial editor handle
 */
void hades_radial_editor_destroy
(
    hades_radial_editor_handle* const phREd
)
{
    hades_radial_editor_data* const editor = (hades_radial_editor_data*)(*phREd);

    if (editor == NULL)
        return;

    free(editor);
    (*phREd) = NULL;
}


/**
 * Applies the radial (360 degree) parameter editing: for every band, the
 * direct-stream gain in the parameter container is multiplied by the gain
 * specified for the (rounded) azimuth of that band's reproduction direction.
 *
 * @param[in]     hREd       hades radial editor handle
 * @param[in,out] hPCon      parameter container; gains_idx is read and
 *                           gains_dir is scaled in place, per band
 * @param[in]     dirGain_dB extra direct-stream gain in decibels, one entry per
 *                           integer azimuth degree 0..359. Each value is
 *                           clamped to [-60, 12] dB before being applied
 */
void hades_radial_editor_apply
(
    hades_radial_editor_handle const hREd,
    hades_param_container_handle  const hPCon,
    float dirGain_dB[360]
)
{
    hades_radial_editor_data *e = (hades_radial_editor_data*)(hREd);
    hades_param_container_data *pcon = (hades_param_container_data*)(hPCon);
    int band, edit_idx;
    float azi, gain_lin;

    for(band=0; band<e->nBands; band++){
        /* Azimuth of this band's reproduction direction (first value of each
         * grid direction pair) */
        azi = e->pGrid_dirs_deg[pcon->gains_idx[band]*2];
        azi = azi < 0.0f ? azi+360.0f : azi;  /* convert -180..180 if needed */

        /* Round to the nearest integer degree and wrap onto 0..359. Azimuth is
         * circular, so anything that rounds to 360 (e.g. 359.6 or -0.4 degrees)
         * belongs to the 0 degree entry, not to the 359 degree entry. */
        edit_idx = (int)(azi + 0.5f) % 360;
        if(edit_idx < 0)
            edit_idx += 360;  /* C remainder keeps the sign of the dividend */

        /* Extra gain factor for the direct stream (dB -> linear amplitude) */
        gain_lin = powf(10.0f, SAF_CLAMP(dirGain_dB[edit_idx], -60.0f, 12.0f)/20.0f);
        pcon->gains_dir[band] *= gain_lin;
    }
}


/* ========================================================================== */

/*                             HADES Synthesis                              */

/* ========================================================================== */


/**
 * Creates an instance of the hades synthesis object and returns its handle
 * via phSyn.
 *
 * The synthesiser takes copies of the analyser's array transfer functions,
 * diffuse covariance matrices, integration weights, scanning grid and centre
 * frequencies, together with a deep copy of the supplied binaural
 * configuration. It then pre-computes, per band, the HRTFs interpolated onto
 * the scanning grid, the normalised binaural diffuse coherence matrix and a
 * diffuse-field equalisation gain.
 *
 * @param[out] phSyn        (&) address of the synthesis handle to populate
 * @param[in]  hAna         hades analysis handle to keep aligned with
 * @param[in]  beamOption   beamformer used for the direct stream
 * @param[in]  enableCM     non-zero to enable covariance matching
 * @param[in]  refIndices   indices of the two reference sensors (left, right)
 * @param[in]  binConfig    binaural configuration; its contents are copied
 * @param[in]  interpOption HRTF interpolation option
 */
void hades_synthesis_create
(
    hades_synthesis_handle* const phSyn,
    hades_analysis_handle const hAna,
    HADES_BEAMFORMER_TYPE beamOption,
    int enableCM,
    int refIndices[2],
    hades_binaural_config* binConfig,
    HADES_HRTF_INTERP_OPTIONS interpOption
)
{
    hades_synthesis_data* syn = (hades_synthesis_data*)malloc1d(sizeof(hades_synthesis_data));
    hades_analysis_data* ana = (hades_analysis_data*)(hAna);
    hades_binaural_config* cfg;
    float_complex* HW_tmp;    /* scratch: H_bin * W for one band */
    float_complex* Hbin_b;    /* start of the current band within H_bin */
    float_complex* dcmBin_b;  /* start of the current band within DCM_bin_norm */
    float_complex* dcmArr_b;  /* start of the current band within DCM_array */
    int b, refL, refR;
    const float_complex c_one = cmplxf(1.0f, 0.0f);  /* blas alpha */
    const float_complex c_zero = cmplxf(0.0f, 0.0f); /* blas beta */

    *phSyn = (hades_synthesis_handle)syn;

    /* Settings supplied by the caller */
    syn->beamOption    = beamOption;
    syn->enableCM      = enableCM;
    syn->refIndices[0] = refIndices[0];
    syn->refIndices[1] = refIndices[1];
    syn->interpOption  = interpOption;
    refL = syn->refIndices[0];
    refR = syn->refIndices[1];

    /* Run-time adjustable parameters, initialised to neutral values */
    syn->eq            = malloc1d(ana->nBands * sizeof(float));
    syn->streamBalance = malloc1d(ana->nBands * sizeof(float));
    for(b = 0; b < ana->nBands; b++){
        syn->eq[b]            = 1.0f; /* flat EQ */
        syn->streamBalance[b] = 1.0f; /* no biasing between direct and ambient streams */
    }
    /* Amount of averaging of the current mixing matrices with the previous ones */
    syn->synAvgCoeff = 1.0f - 1.0f/(4096.0f/ana->blocksize);

    /* Scalars mirrored from the analyser, so that both stay aligned */
    syn->fbOpt     = ana->fbOpt;
    syn->nBands    = ana->nBands;
    syn->hopsize   = ana->hopsize;
    syn->blocksize = ana->blocksize;
    syn->nGrid     = ana->nGrid;
    syn->nMics     = ana->nMics;
    syn->timeSlots = ana->timeSlots;

    /* Arrays duplicated from the analyser */
    syn->H_array = malloc1d(syn->nBands*(syn->nMics)*(syn->nGrid)*sizeof(float_complex));
    memcpy(syn->H_array, ana->H_array, syn->nBands*(syn->nMics)*(syn->nGrid)*sizeof(float_complex));

    syn->DCM_array = malloc1d(syn->nBands*(syn->nMics)*(syn->nMics)*sizeof(float_complex));
    memcpy(syn->DCM_array, ana->DCM_array, syn->nBands*(syn->nMics)*(syn->nMics)*sizeof(float_complex));

    syn->W = malloc1d(syn->nGrid*(syn->nGrid)*sizeof(float_complex));
    memcpy(syn->W, ana->W, syn->nGrid*(syn->nGrid)*sizeof(float_complex));

    syn->grid_dirs_deg = malloc1d((syn->nGrid)*2*sizeof(float));
    memcpy(syn->grid_dirs_deg, ana->grid_dirs_deg, (syn->nGrid)*2*sizeof(float));

    syn->grid_dirs_xyz = (float**)malloc2d((syn->nGrid), 3, sizeof(float));
    memcpy(FLATTEN2D(syn->grid_dirs_xyz), ana->grid_dirs_xyz, (syn->nGrid)*3*sizeof(float));

    syn->freqVector = malloc1d(syn->nBands*sizeof(float));
    memcpy(syn->freqVector, ana->freqVector, syn->nBands*sizeof(float));

    /* Time-frequency transform (decoder side); the low-delay flag is the only
     * difference between the two filterbank options */
    if(syn->fbOpt == HADES_USE_AFSTFT_LD)
        afSTFT_create(&(syn->hFB_dec), 0, NUM_EARS, syn->hopsize, 1, ana->hybridmode, AFSTFT_BANDS_CH_TIME);
    else if(syn->fbOpt == HADES_USE_AFSTFT)
        afSTFT_create(&(syn->hFB_dec), 0, NUM_EARS, syn->hopsize, 0, ana->hybridmode, AFSTFT_BANDS_CH_TIME);

    /* Deep copy of the binaural configuration */
    syn->binConfig = malloc1d(sizeof(hades_binaural_config));
    cfg = syn->binConfig;
    cfg->lHRIR   = binConfig->lHRIR;
    cfg->nHRIR   = binConfig->nHRIR;
    cfg->hrir_fs = binConfig->hrir_fs;
    cfg->hrirs   = malloc1d(cfg->nHRIR * NUM_EARS * (cfg->lHRIR) * sizeof(float));
    memcpy(cfg->hrirs, binConfig->hrirs, cfg->nHRIR * NUM_EARS * (cfg->lHRIR) * sizeof(float));
    cfg->hrir_dirs_deg = malloc1d(cfg->nHRIR*2*sizeof(float));
    memcpy(cfg->hrir_dirs_deg, binConfig->hrir_dirs_deg, cfg->nHRIR*2*sizeof(float));

    /* Pre-process HRTFs: interpolate them for the scanning grid */
    syn->H_bin = calloc1d(syn->nBands*NUM_EARS*(syn->nGrid),sizeof(float_complex));
    hades_getInterpolatedHRTFs(hAna, interpOption, cfg, ana->grid_dirs_deg, syn->nGrid, syn->H_bin);

    /* Diffuse rendering variables */
    syn->DCM_bin_norm = malloc1d(ana->nBands*NUM_EARS*NUM_EARS*sizeof(float_complex));
    HW_tmp = malloc1d(NUM_EARS*(ana->nGrid)*sizeof(float_complex));
    syn->diffEQ = malloc1d(ana->nBands*sizeof(float));
    for(b = 0; b < syn->nBands; b++){
        Hbin_b   = &(syn->H_bin[b*NUM_EARS*(ana->nGrid)]);
        dcmBin_b = &(syn->DCM_bin_norm[b*NUM_EARS*NUM_EARS]);
        dcmArr_b = &(syn->DCM_array[b*(syn->nMics)*(syn->nMics)]);

        /* Binaural diffuse coherence matrix, (H_bin W H_bin^H)/nGrid (not normalised yet!) */
        cblas_cgemm(CblasRowMajor, CblasNoTrans, CblasNoTrans, NUM_EARS, ana->nGrid, ana->nGrid, &c_one,
                    Hbin_b, ana->nGrid,
                    ana->W, ana->nGrid, &c_zero,
                    HW_tmp, ana->nGrid);
        cblas_cgemm(CblasRowMajor, CblasNoTrans, CblasConjTrans, NUM_EARS, NUM_EARS, ana->nGrid, &c_one,
                    HW_tmp, ana->nGrid,
                    Hbin_b, ana->nGrid, &c_zero,
                    dcmBin_b, NUM_EARS);
        cblas_sscal(/*re+im*/2*NUM_EARS*NUM_EARS, 1.0f/(float)ana->nGrid, (float*)dcmBin_b, 1);

        /* EQ that brings the overall diffuse-field magnitude response of the
         * array to that of the HRTFs instead:
         * sqrt(trace(H_bin_dcm(:,:,band))/(trace(H_grid_dcm(refIndices,refIndices,band))+eps))
         * (elements [0] and [3] are the diagonal of the 2 x 2 binaural matrix) */
        syn->diffEQ[b] = sqrtf((crealf(dcmBin_b[0]) + crealf(dcmBin_b[3])) /
                               (crealf(dcmArr_b[refL*(syn->nMics) + refL]) +
                                crealf(dcmArr_b[refR*(syn->nMics) + refR]) + 2.23e-10f));
        syn->diffEQ[b] = SAF_MIN(syn->diffEQ[b], 3.0f); /* Cap at a maximum of +9dB */

        /* Normalise the binaural diffuse coherence matrix by its trace */
        cblas_sscal(/*re+im*/2*NUM_EARS*NUM_EARS, 1.0f/(crealf(dcmBin_b[0]) + crealf(dcmBin_b[3]) + 2.23e-10f),
                    (float*)dcmBin_b, 1);
    }
    free(HW_tmp);

    /* Run-time solver/work handles */
    utility_cpinv_create(&(syn->hPinv), syn->nMics, syn->nMics);
    utility_cglslv_create(&(syn->hLinSolve), syn->nMics, syn->nMics);
    cdf4sap_cmplx_create(&(syn->hCDF), syn->nMics, NUM_EARS);

    /* Run-time vectors and matrices */
    syn->As     = malloc1d(syn->nMics*sizeof(float_complex));
    syn->As_l   = malloc1d(syn->nMics*sizeof(float_complex));
    syn->As_r   = malloc1d(syn->nMics*sizeof(float_complex));
    syn->Q_diff = malloc1d(NUM_EARS*(syn->nMics)*sizeof(float_complex));
    syn->Q_dir  = malloc1d(NUM_EARS*(syn->nMics)*sizeof(float_complex));
    syn->Q      = malloc1d(NUM_EARS*(syn->nMics)*sizeof(float_complex));
    syn->Cy     = malloc1d(NUM_EARS*NUM_EARS*sizeof(float_complex));
    syn->new_M  = malloc1d(NUM_EARS*(syn->nMics)*sizeof(float_complex));
    syn->M      = (float_complex**)malloc2d(syn->nBands, NUM_EARS*(syn->nMics), sizeof(float_complex));

    /* Run-time audio buffers */
    syn->outTF = (float_complex***)malloc3d(syn->nBands, NUM_EARS, syn->timeSlots, sizeof(float_complex));
    syn->outTD = (float**)malloc2d(NUM_EARS, syn->blocksize, sizeof(float));

    /* Flush run-time buffers with zeros */
    hades_synthesis_reset((*phSyn));
}


/**
 * Destroys an instance of hades synthesis, releasing the memory and work
 * handles held by the object, and sets the caller's handle to NULL.
 *
 * Passing a handle that is already NULL is a no-op.
 *
 * @param[in,out] phSyn (&) address of the synthesis handle
 */
void hades_synthesis_destroy
(
    hades_synthesis_handle* const phSyn
)
{
    hades_synthesis_data *s = (hades_synthesis_data*)(*phSyn);

    if (s != NULL) {
        /* Free user parameters */
        free(s->eq);
        free(s->streamBalance);

        /* The binaural configuration is a deep copy: hades_synthesis_create()
         * allocates the HRIR data and the HRIR directions separately from the
         * struct, so they must be released before the struct itself. */
        if (s->binConfig != NULL) {
            free(s->binConfig->hrirs);
            free(s->binConfig->hrir_dirs_deg);
            free(s->binConfig);
        }

        /* Free things copied from analyser */
        free(s->H_array);
        free(s->DCM_array);
        free(s->W);
        free(s->grid_dirs_deg);
        free(s->grid_dirs_xyz);
        free(s->freqVector);

        /* Free time-frequency transform */
        switch(s->fbOpt){
            case HADES_USE_AFSTFT_LD: /* fall through */
            case HADES_USE_AFSTFT:    afSTFT_destroy(&(s->hFB_dec)); break;
        }

        /* HRTF and diffuse rendering variables */
        free(s->H_bin);
        free(s->DCM_bin_norm);
        free(s->diffEQ);

        /* Run-time variables */
        utility_cpinv_destroy(&(s->hPinv));
        utility_cglslv_destroy(&(s->hLinSolve));
        cdf4sap_cmplx_destroy(&(s->hCDF));
        free(s->As);
        free(s->As_l);
        free(s->As_r);
        free(s->Q_diff);
        free(s->Q_dir);
        free(s->Q);
        free(s->Cy);
        free(s->new_M);
        free(s->M);

        /* Run-time audio buffers */
        free(s->outTF);
        free(s->outTD);

        free(s);
        (*phSyn) = NULL;
    }
}


/**
 * Flushes the synthesiser's run-time state with zeros: the filterbank
 * buffers are cleared and the temporally-averaged mixing matrices are zeroed.
 *
 * Passing a NULL handle is a no-op.
 *
 * @param[in] hSyn hades synthesis handle
 */
void hades_synthesis_reset
(
    hades_synthesis_handle const hSyn
)
{
    hades_synthesis_data* const syn = (hades_synthesis_data*)(hSyn);

    if(syn == NULL)
        return;

    /* Both supported filterbank options use the same afSTFT decoder handle */
    if(syn->fbOpt == HADES_USE_AFSTFT_LD || syn->fbOpt == HADES_USE_AFSTFT)
        afSTFT_clearBuffers(syn->hFB_dec);

    /* Mixing matrices for all bands; M is contiguous: nBands x (NUM_EARS*nMics) */
    memset(FLATTEN2D(syn->M), 0, syn->nBands*NUM_EARS*(syn->nMics)*sizeof(float_complex));
}


/**
 * Performs hades synthesis for one block: builds a NUM_EARS x nMics mixing
 * matrix per band from the supplied spatial parameters and signal statistics,
 * averages it with the previous block's matrix, applies it to the input
 * time-frequency signals, and inverse-transforms the result.
 *
 * @param[in]  hSyn      hades synthesis handle
 * @param[in]  hPCon     parameter container; diffuseness, doa_idx, gains_idx,
 *                       gains_dir and gains_diff are read per band
 * @param[in]  hSCon     signal container; the per-band covariance matrices
 *                       (Cx) and input time-frequency signals (inTF) are read
 * @param[in]  nChannels number of channels in 'output'
 * @param[in]  blocksize number of samples written to each output channel
 * @param[out] output    output signals; nChannels x blocksize. The first
 *                       NUM_EARS channels receive the binaural signals and any
 *                       further channels are filled with zeros
 *
 * NOTE(review): none of the handles, doa_idx/gains_idx, or blocksize are
 * validated here. Presumably blocksize must equal the blocksize the
 * synthesiser was created with (outTD is sized elsewhere) - confirm against
 * callers.
 */
void hades_synthesis_apply
(
    hades_synthesis_handle const hSyn,
    hades_param_container_handle  const hPCon,
    hades_signal_container_handle const hSCon,
    int nChannels,
    int blocksize,
    float** output
)
{
    hades_synthesis_data *s = (hades_synthesis_data*)(hSyn);
    hades_param_container_data *pcon = (hades_param_container_data*)(hPCon);
    hades_signal_container_data *scon = (hades_signal_container_data*)(hSCon);
    int i, j, ch, nMics, band, doa_idx, gain_idx;
    float a, b, diffuseness, synAvgCoeff, streamBalance, eq, gain_dir, gain_diff, trace_M, reg_M, sum_As, targetEnergy;
    float_complex g_l, g_r, h_dir[NUM_EARS], AsH_invCx_As;
    float_complex Cx[HADES_MAX_NMICS*HADES_MAX_NMICS], conj_As[HADES_MAX_NMICS], AsH_invCx[HADES_MAX_NMICS*HADES_MAX_NMICS];
    const float_complex calpha = cmplxf(1.0f, 0.0f); const float_complex cbeta = cmplxf(0.0f, 0.0f); /* blas */

    nMics = s->nMics;
    /* The user-adjustable coefficient is capped below 1, so that the new
     * mixing matrix always contributes to the running average */
    synAvgCoeff = SAF_CLAMP((s->synAvgCoeff), 0.0f, 0.99f);

    /* Loop over bands and compute the mixing matrices */
    for (band = 0; band < s->nBands; band++) {
        /* Pull estimated (and possibly modified) spatial parameters for this band */
        diffuseness = pcon->diffuseness[band];
        saf_assert(diffuseness>-0.0001f && diffuseness < 1.00001f, "Erroneous parameter analysis");
        doa_idx = pcon->doa_idx[band];     /* grid index used to look up the array steering vector */
        gain_idx = pcon->gains_idx[band];  /* grid index used to look up the HRTF */
        gain_dir  = pcon->gains_dir[band];
        gain_diff = pcon->gains_diff[band];

        /* Optional biasing (e.g. to conduct de-reverberation or to emphasise reverberation) */
        streamBalance = SAF_CLAMP(s->streamBalance[band], 0.0f, 2.0f);
        eq = s->eq[band];
        if(streamBalance<1.0f){
            a = streamBalance;        /* scale the direct stream by streamBalance (<1 here, i.e. attenuate it) */
            b = 1.0f;                 /* pass ambient stream as normal */
        }
        else {
            a = 1.0f;                 /* pass source stream as normal */
            b = 2.0f - streamBalance; /* pump less ambient energy into output */
        }
        /* Fold the per-band stream gains from the parameter container into the weights */
        a *= gain_dir;
        b *= gain_diff;

        /* Source array steering vector for the estimated DoAs */
        for(i=0; i<nMics; i++)
            s->As[i] = s->H_array[band*nMics*(s->nGrid) + i*(s->nGrid) + doa_idx];

        /* Anechoic relative transfer functions (RTFs), w.r.t. the left and right reference sensors */
        /* NOTE(review): a zero steering-vector entry at a reference sensor would make these divisions by zero */
        for(i=0; i<nMics; i++){
            s->As_l[i] = ccdivf(s->As[i], s->As[s->refIndices[0]]);
            s->As_r[i] = ccdivf(s->As[i], s->As[s->refIndices[1]]);
        }

        /* HRTF for this reproduction DoA */
        h_dir[0] = s->H_bin[band*NUM_EARS*(s->nGrid) + 0*(s->nGrid) + gain_idx];
        h_dir[1] = s->H_bin[band*NUM_EARS*(s->nGrid) + 1*(s->nGrid) + gain_idx];
        g_l = ccdivf(h_dir[0], s->As[s->refIndices[0]]); /* (Relative transfer functions) */
        g_r = ccdivf(h_dir[1], s->As[s->refIndices[1]]);
        if(cabsf(g_l)>4.0f || cabsf(g_r)>4.0f) /* if >12dB, then bypass: */
            g_l = g_r = cmplxf(1.0f, 0.0f);

        /* Diffuse mixing matrix (if the sound-field is analysed to be more diffuse, then we mix in more of just the reference sensors) */
        memset(s->Q_diff, 0, NUM_EARS*nMics*sizeof(float_complex));
        s->Q_diff[0*nMics+s->refIndices[0]] = cmplxf(s->diffEQ[band], 0.0f);
        s->Q_diff[1*nMics+s->refIndices[1]] = cmplxf(s->diffEQ[band], 0.0f);

        /* Source mixing matrix (beamforming towards the estimated DoAs) */
        switch(s->beamOption){
            case HADES_BEAMFORMER_NONE: /* No beamforming required */ break;
            case HADES_BEAMFORMER_FILTER_AND_SUM:
                /* Normalise the beamformers to unity gain in the look direction */
                utility_cpinv(s->hPinv, s->As_l, nMics, 1, s->Q_dir);
                utility_cpinv(s->hPinv, s->As_r, nMics, 1, s->Q_dir + nMics);

                /* Now bring their response from being w.r.t the array to being w.r.t the HRTF instead */
                cblas_cscal(nMics, &g_l, s->Q_dir, 1);
                cblas_cscal(nMics, &g_r, s->Q_dir + nMics, 1);
                break;

            case HADES_BEAMFORMER_BMVDR:
                /* prep: work on a local copy of the covariance matrix, since it is regularised in place below */
                cblas_ccopy(nMics*nMics, scon->Cx[band].Cx, 1, Cx, 1);
                trace_M = 0.0f;
                for(i=0; i<nMics; i++)
                    trace_M += crealf(Cx[i*nMics+i]);
                sum_As = cblas_scasum(nMics, s->As, 1);

                /* Compute beamforming weights if checks pass (otherwise the direct-stream weights are zeroed) */
                if( trace_M < 0.0001f || sum_As < 0.0001f)
                    memset(s->Q_dir, 0, NUM_EARS*nMics*sizeof(float_complex));
                else{
                    /* Regularise Cx (diagonal loading proportional to the mean diagonal value) */
                    reg_M = (trace_M/(float)nMics) * 10.0f + 0.0001f;
                    for(i=0; i<nMics; i++)
                        Cx[i*nMics+i] = craddf(Cx[i*nMics+i], reg_M);

                    /* Compute MVDR weights w.r.t the reference sensor at each ear, [As^H Cx^-1 As]^-1 As^H Cx^-1  */
                    for(j=0; j<NUM_EARS; j++){
                        /* Solve As^H Cx-1 */
                        utility_cvconj(j==0 ? s->As_l : s->As_r, nMics, conj_As);
                        utility_cglslv(s->hLinSolve, Cx, nMics, conj_As, 1, AsH_invCx);

                        /* Compute As^H Cx-1 As */
                        utility_cvvdot(AsH_invCx, j==0 ? s->As_l : s->As_r, nMics, NO_CONJ, &AsH_invCx_As);
                        AsH_invCx_As = craddf(AsH_invCx_As, 0.00001f); /* small offset to the real part before inverting */

                        /* The solution */
                        AsH_invCx_As = ccdivf(cmplxf(1.0f, 0.0f), AsH_invCx_As);
                        cblas_cscal(nMics, &AsH_invCx_As, AsH_invCx, 1);
                        cblas_ccopy(nMics, AsH_invCx, 1, s->Q_dir + j*nMics, 1);
                    }

                    /* Now bring their response from being w.r.t the array to instead being w.r.t the HRTF */
                    cblas_cscal(nMics, &g_l, s->Q_dir, 1);
                    cblas_cscal(nMics, &g_r, s->Q_dir + nMics, 1);
                }
                break;
        }

        /* Prototype mixing matrix */
        if(s->beamOption==HADES_BEAMFORMER_NONE){
            /* No beamforming (just pass through the reference signals) */
            memset(s->Q, 0, NUM_EARS*nMics*sizeof(float_complex));
            s->Q[0*nMics+s->refIndices[0]] = cmplxf(1.0f, 0.0f);
            s->Q[1*nMics+s->refIndices[1]] = cmplxf(1.0f, 0.0f);
            //s->Q[0*nMics+s->refIndices[0]] = cmplxf(s->diffEQ[band], 0.0f);
            //s->Q[1*nMics+s->refIndices[1]] = cmplxf(s->diffEQ[band], 0.0f);
        }
        else{
            /* Mix in the beamforming weights, conforming to the assumed direct-diffuse model */
            /* i.e. Q = eq*a*(1-diffuseness)*Q_dir + eq*b*diffuseness*Q_diff */
            cblas_ccopy(NUM_EARS*nMics, s->Q_dir, 1, s->Q, 1);
            cblas_sscal(/*re+im*/2*NUM_EARS*nMics, eq*a*(1.0f-diffuseness), (float*)s->Q, 1);
            cblas_saxpy(/*re+im*/2*NUM_EARS*nMics, eq*b*diffuseness, (float*)s->Q_diff, 1, (float*)s->Q, 1);
        }

        /* Target output signal energy (used for the covariance matching) */
        targetEnergy = 0.0f;
        for(i=0; i<nMics; i++)
            targetEnergy += crealf(scon->Cx[band].Cx[i*nMics+i]);
        targetEnergy = eq*0.25f*targetEnergy * s->diffEQ[band];

        /* Final mixing matrix */
        if(s->enableCM && targetEnergy>0.0001f){
            /* "Direct" contributions to the target spatial covariance matrix */
            cblas_cgemm(CblasRowMajor, CblasNoTrans, CblasConjTrans, NUM_EARS, NUM_EARS, 1, &calpha,
                        h_dir, 1,
                        h_dir, 1, &cbeta,
                        s->Cy, NUM_EARS);
            cblas_sscal(/*re+im*/2*NUM_EARS*NUM_EARS, eq*a*(1.0f-diffuseness)*targetEnergy, (float*)s->Cy, 1);

            /* "Diffuse" contributions to the target spatial covariance matrix */
            cblas_saxpy(/*re+im*/2*NUM_EARS*NUM_EARS, eq*b*diffuseness*targetEnergy, (float*)&(s->DCM_bin_norm[band*NUM_EARS*NUM_EARS]), 1, (float*)s->Cy, 1);

            /* Solve the covariance matching problem */
            formulate_M_and_Cr_cmplx(s->hCDF, (float_complex*)scon->Cx[band].Cx, s->Cy, s->Q, 1, 0.1f, s->new_M, NULL);
        }
        else
            cblas_ccopy(NUM_EARS*nMics, s->Q, 1, s->new_M, 1); /* use the prototype matrix as is */

        /* Optional Equalisation */
        /* NOTE(review): eq has already been applied when forming Q (beamforming case) and Cy above - confirm the repeated scaling is intended */
        cblas_sscal(/*re+im*/2*NUM_EARS*nMics, eq, (float*)s->new_M, 1);

        /* Temporal averaging of mixing matrices: M = synAvgCoeff*M + (1-synAvgCoeff)*new_M */
        cblas_sscal(/*re+im*/2*NUM_EARS*nMics, synAvgCoeff, (float*)s->M[band], 1);
        cblas_saxpy(/*re+im*/2*NUM_EARS*nMics, 1.0f-synAvgCoeff, (float*)s->new_M, 1, (float*)s->M[band], 1);
    }

    /* Apply mixing matrices: outTF[band] (NUM_EARS x timeSlots) = M[band] (NUM_EARS x nMics) * inTF[band] (nMics x timeSlots) */
    for(band=0; band<s->nBands; band++){
        cblas_cgemm(CblasRowMajor, CblasNoTrans, CblasNoTrans, NUM_EARS, s->timeSlots, nMics, &calpha,
                    s->M[band], nMics,
                    FLATTEN2D(scon->inTF[band]), s->timeSlots, &cbeta,
                    FLATTEN2D(s->outTF[band]), s->timeSlots);
    }

    /* inverse time-frequency transform */
    switch(s->fbOpt){
        case HADES_USE_AFSTFT_LD: /* fall through */
        case HADES_USE_AFSTFT:    afSTFT_backward_knownDimensions(s->hFB_dec, s->outTF, blocksize, NUM_EARS, s->timeSlots, s->outTD);   break;
    }

    /* Copy to output (channels beyond NUM_EARS are zeroed) */
    for(ch=0; ch<SAF_MIN(nChannels, NUM_EARS); ch++)
        memcpy(output[ch], s->outTD[ch], blocksize*sizeof(float));
    for(; ch<nChannels; ch++)
        memset(output[ch], 0, blocksize*sizeof(float));
}


/**
 * Returns a pointer to the per-band eq vector, which can be changed at
 * run-time.
 *
 * @param[in]  hSyn   hades synthesis handle
 * @param[out] nBands (&) receives the number of bands (the length of the
 *                    returned vector), or 0 if hSyn is NULL; may itself be
 *                    NULL if the value is not needed
 * @returns pointer to the eq vector, or NULL if hSyn is NULL
 */
float* hades_synthesis_getEqPtr
(
    hades_synthesis_handle const hSyn,
    int* nBands
)
{
    hades_synthesis_data* const syn = (hades_synthesis_data*)(hSyn);

    if(nBands != NULL)
        (*nBands) = (syn != NULL) ? syn->nBands : 0;

    return (syn != NULL) ? syn->eq : NULL;
}


/**
 * Returns a pointer to the per-band stream balance vector, which can be
 * changed at run-time.
 *
 * @param[in]  hSyn   hades synthesis handle
 * @param[out] nBands (&) receives the number of bands (the length of the
 *                    returned vector), or 0 if hSyn is NULL; may itself be
 *                    NULL if the value is not needed
 * @returns pointer to the stream balance vector, or NULL if hSyn is NULL
 */
float* hades_synthesis_getStreamBalancePtr
(
    hades_synthesis_handle const hSyn,
    int* nBands
)
{
    hades_synthesis_data* const syn = (hades_synthesis_data*)(hSyn);

    if(nBands != NULL)
        (*nBands) = (syn != NULL) ? syn->nBands : 0;

    return (syn != NULL) ? syn->streamBalance : NULL;
}


/**
 * Returns a pointer to the synthesis averaging coefficient scalar, which can
 * be changed at run-time.
 *
 * @param[in] hSyn hades synthesis handle
 * @returns pointer to the coefficient, or NULL if hSyn is NULL
 */
float* hades_synthesis_getSynthesisAveragingCoeffPtr
(
    hades_synthesis_handle const hSyn
)
{
    hades_synthesis_data* const syn = (hades_synthesis_data*)(hSyn);

    return (syn != NULL) ? &(syn->synAvgCoeff) : NULL;
}


/**
 * Returns the synthesiser processing delay, in samples.
 *
 * This is always 0, for a valid or a NULL handle alike: the delay is
 * accounted for in hades_analysis_getProcDelay().
 *
 * @param[in] hSyn hades synthesis handle (not inspected)
 * @returns 0
 */
int hades_synthesis_getProcDelay
(
    hades_synthesis_handle const hSyn
)
{
    (void)hSyn; /* the result does not depend on the handle */

    return 0; /* Accounted for in hades_analysis_getProcDelay() */
}


#endif /* SAF_ENABLE_HADES_MODULE */

afSTFT_clearBuffers
void afSTFT_clearBuffers(void *const hSTFT)
Flushes time-domain buffers with zeros.
Definition afSTFTlib.c:519

afSTFT_create
void afSTFT_create(void **const phSTFT, int nCHin, int nCHout, int hopsize, int lowDelayMode, int hybridmode, AFSTFT_FDDATA_FORMAT format)
Creates an instance of afSTFT.
Definition afSTFTlib.c:143

afSTFT_backward_knownDimensions
void afSTFT_backward_knownDimensions(void *const hSTFT, float_complex ***dataFD, int framesize, int dataFD_nCH, int dataFD_nHops, float **dataTD)
Performs backward afSTFT transform (dataFD dimensions are known)
Definition afSTFTlib.c:391

afSTFT_destroy
void afSTFT_destroy(void **const phSTFT)
Destroys an instance of afSTFT.
Definition afSTFTlib.c:199

AFSTFT_BANDS_CH_TIME
@ AFSTFT_BANDS_CH_TIME
nBands x nChannels x nTimeHops
Definition afSTFTlib.h:80

formulate_M_and_Cr_cmplx
void formulate_M_and_Cr_cmplx(void *const hCdf, float_complex *Cx, float_complex *Cy, float_complex *Q, int useEnergyFLAG, float reg, float_complex *M, float_complex *Cr)
Computes the optimal mixing matrices.
Definition saf_cdf4sap.c:407

cdf4sap_cmplx_destroy
void cdf4sap_cmplx_destroy(void **const phCdf)
Destroys an instance of the Covariance Domain Framework.
Definition saf_cdf4sap.c:234

cdf4sap_cmplx_create
void cdf4sap_cmplx_create(void **const phCdf, int nXcols, int nYcols)
Creates an instance of the Covariance Domain Framework.
Definition saf_cdf4sap.c:140

saf_assert
#define saf_assert(x, message)
Macro to make an assertion, along with a string explaining its purpose.
Definition saf_utilities.h:133

utility_cpinv_create
void utility_cpinv_create(void **const phWork, int maxDim1, int maxDim2)
(Optional) Pre-allocate the working struct used by utility_cpinv()
Definition saf_utility_veclib.c:3660

SAF_CLAMP
#define SAF_CLAMP(a, min, max)
Ensures value "a" is clamped between the "min" and "max" values.
Definition saf_utilities.h:61

utility_cglslv_destroy
void utility_cglslv_destroy(void **const phWork)
De-allocate the working struct used by utility_cglslv()
Definition saf_utility_veclib.c:2922

utility_cglslv
void utility_cglslv(void *const hWork, const float_complex *A, const int dim, float_complex *B, int nCol, float_complex *X)
General linear solver: single precision complex, i.e.
Definition saf_utility_veclib.c:2938

NUM_EARS
#define NUM_EARS
2 (true for most humans)
Definition saf_utilities.h:52

utility_cpinv
void utility_cpinv(void *const hWork, const float_complex *inM, const int dim1, const int dim2, float_complex *outM)
General matrix pseudo-inverse (the svd way): single precision complex, i.e.
Definition saf_utility_veclib.c:3696

utility_cpinv_destroy
void utility_cpinv_destroy(void **const phWork)
De-allocate the working struct used by utility_cpinv()
Definition saf_utility_veclib.c:3677

SAF_MIN
#define SAF_MIN(a, b)
Returns the minimum of the two values.
Definition saf_utilities.h:55

utility_cvvdot
void utility_cvvdot(const float_complex *a, const float_complex *b, const int len, CONJ_FLAG flag, float_complex *c)
Single-precision, complex, vector-vector dot product, i.e.
Definition saf_utility_veclib.c:1219

utility_cglslv_create
void utility_cglslv_create(void **const phWork, int maxDim, int maxNCol)
(Optional) Pre-allocate the working struct used by utility_cglslv()
Definition saf_utility_veclib.c:2909

utility_cvconj
void utility_cvconj(const float_complex *a, const int len, float_complex *c)
Single-precision, complex, vector-conjugate, i.e.
Definition saf_utility_veclib.c:549

NO_CONJ
@ NO_CONJ
Do not take the conjugate.
Definition saf_utility_veclib.h:41

malloc2d
void ** malloc2d(size_t dim1, size_t dim2, size_t data_size)
2-D malloc (contiguously allocated, so use free() as usual to deallocate)
Definition md_malloc.c:89

malloc1d
void * malloc1d(size_t dim1_data_size)
1-D malloc (same as malloc, but with error checking)
Definition md_malloc.c:59

calloc1d
void * calloc1d(size_t dim1, size_t data_size)
1-D calloc (same as calloc, but with error checking)
Definition md_malloc.c:69

malloc3d
void *** malloc3d(size_t dim1, size_t dim2, size_t dim3, size_t data_size)
3-D malloc (contiguously allocated, so use free() as usual to deallocate)
Definition md_malloc.c:151

FLATTEN2D
#define FLATTEN2D(A)
Use this macro when passing a 2-D dynamic multi-dimensional array to memset, memcpy or any other func...
Definition md_malloc.h:65

HADES_MAX_NMICS
#define HADES_MAX_NMICS
Maximum number of microphones.
Definition saf_hades_analysis.h:48

hades_analysis_handle
struct _hades_analysis_data * hades_analysis_handle
Handle for the hades analysis data.
Definition saf_hades_analysis.h:51

hades_param_container_handle
struct _hades_param_container_data * hades_param_container_handle
Handle for the hades parameter container data.
Definition saf_hades_analysis.h:54

hades_signal_container_handle
struct _hades_signal_container_data * hades_signal_container_handle
Handle for the hades signal container data.
Definition saf_hades_analysis.h:57

HADES_USE_AFSTFT
@ HADES_USE_AFSTFT
Alias-free STFT filterbank.
Definition saf_hades_analysis.h:82

HADES_USE_AFSTFT_LD
@ HADES_USE_AFSTFT_LD
Alias-free STFT filterbank (low delay)
Definition saf_hades_analysis.h:81

hades_getInterpolatedHRTFs
void hades_getInterpolatedHRTFs(hades_analysis_handle const hAna, HADES_HRTF_INTERP_OPTIONS interpOption, hades_binaural_config *binConfig, float *target_dirs_deg, int nTargetDirs, float_complex *hrtf_interp)
Binaural filter interpolator.
Definition saf_hades_internal.c:43

saf_hades_internal.h
Internal header for the HADES module (SAF_HADES_MODULE)

hades_radial_editor_destroy
void hades_radial_editor_destroy(hades_radial_editor_handle *const phREd)
Destroys an instance of a hades radial editor object.
Definition saf_hades_synthesis.c:64

hades_synthesis_getProcDelay
int hades_synthesis_getProcDelay(hades_synthesis_handle const hSyn)
Returns the synthesiser processing delay, in samples.
Definition saf_hades_synthesis.c:547

hades_radial_editor_apply
void hades_radial_editor_apply(hades_radial_editor_handle const hREd, hades_param_container_handle const hPCon, float dirGain_dB[360])
Applies the radial (360 degree) parameter editing.
Definition saf_hades_synthesis.c:78

hades_radial_editor_create
void hades_radial_editor_create(hades_radial_editor_handle *const phREd, hades_analysis_handle const hAna)
Creates and returns a handle to an instance of a hades radial editor object, which allows for directi...
Definition saf_hades_synthesis.c:48

hades_synthesis_getEqPtr
float * hades_synthesis_getEqPtr(hades_synthesis_handle const hSyn, int *nBands)
Returns a pointer to the eq vector, which can be changed at run-time.
Definition saf_hades_synthesis.c:500

hades_synthesis_getSynthesisAveragingCoeffPtr
float * hades_synthesis_getSynthesisAveragingCoeffPtr(hades_synthesis_handle const hSyn)
Returns a pointer to the synthesis averaging coefficient scalar [0..1], which can be changed at run-t...
Definition saf_hades_synthesis.c:536

hades_synthesis_apply
void hades_synthesis_apply(hades_synthesis_handle const hSyn, hades_param_container_handle const hPCon, hades_signal_container_handle const hSCon, int nChannels, int blocksize, float **output)
Performs hades synthesis.
Definition saf_hades_synthesis.c:309

hades_synthesis_create
void hades_synthesis_create(hades_synthesis_handle *const phSyn, hades_analysis_handle const hAna, HADES_BEAMFORMER_TYPE beamOption, int enableCM, int refIndices[2], hades_binaural_config *binConfig, HADES_HRTF_INTERP_OPTIONS interpOption)
Creates and returns a handle to an instance of a hades synthesis object.
Definition saf_hades_synthesis.c:107

hades_synthesis_getStreamBalancePtr
float * hades_synthesis_getStreamBalancePtr(hades_synthesis_handle const hSyn, int *nBands)
Returns a pointer to the stream balance vector [0..2], which can be changed at run-time.
Definition saf_hades_synthesis.c:518

hades_synthesis_reset
void hades_synthesis_reset(hades_synthesis_handle const hSyn)
Flushes run-time buffers with zeros.
Definition saf_hades_synthesis.c:291

hades_synthesis_destroy
void hades_synthesis_destroy(hades_synthesis_handle *const phSyn)
Destroys an instance of hades synthesis.
Definition saf_hades_synthesis.c:235

saf_hades_synthesis.h
Header for the HADES synthesis (SAF_HADES_MODULE)

hades_radial_editor_handle
struct _hades_radial_editor_data * hades_radial_editor_handle
Handle for the hades radial editor data.
Definition saf_hades_synthesis.h:53

hades_synthesis_handle
struct _hades_synthesis_data * hades_synthesis_handle
Handle for the hades synthesis data.
Definition saf_hades_synthesis.h:50

HADES_BEAMFORMER_TYPE
HADES_BEAMFORMER_TYPE
Beamforming options for hades_synthesis.
Definition saf_hades_synthesis.h:71

HADES_BEAMFORMER_FILTER_AND_SUM
@ HADES_BEAMFORMER_FILTER_AND_SUM
Filter-and-sum beamforming.
Definition saf_hades_synthesis.h:73

HADES_BEAMFORMER_BMVDR
@ HADES_BEAMFORMER_BMVDR
Binaural minimum-variance distortionless response (MVDR) beamforming.
Definition saf_hades_synthesis.h:74

HADES_BEAMFORMER_NONE
@ HADES_BEAMFORMER_NONE
No beamforming (ref sensors only)
Definition saf_hades_synthesis.h:72

HADES_HRTF_INTERP_OPTIONS
HADES_HRTF_INTERP_OPTIONS
HRTF interpolation options for hades_synthesis.
Definition saf_hades_synthesis.h:79

hades_analysis_data
Main structure for hades analysis.
Definition saf_hades_internal.h:66

hades_analysis_data::nMics
int nMics
Number of microphones.
Definition saf_hades_internal.h:76

hades_analysis_data::blocksize
int blocksize
Number of samples to process at a time (note that one DoA and diffuseness estimate is made per block)
Definition saf_hades_internal.h:71

hades_analysis_data::hybridmode
int hybridmode
Optionally, the lowest TF bands may be subdivided to improve low-freq resolution.
Definition saf_hades_internal.h:72

hades_analysis_data::DCM_array
float_complex * DCM_array
Diffuse covariance matrix (computed over all grid directions and weighted); FLAT: nBands x nMics x nMics.
Definition saf_hades_internal.h:90

hades_analysis_data::grid_dirs_xyz
float * grid_dirs_xyz
Scanning grid coordinates (unit vectors and only used by grid-based estimators); FLAT: nGrid x 3.
Definition saf_hades_internal.h:98

hades_analysis_data::freqVector
float * freqVector
Centre frequencies; nBands x 1.
Definition saf_hades_internal.h:89

hades_analysis_data::grid_dirs_deg
float * grid_dirs_deg
Array grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:74

hades_analysis_data::hopsize
int hopsize
Filterbank hop size (blocksize must be divisible by this).
Definition saf_hades_internal.h:70

hades_analysis_data::fbOpt
HADES_FILTERBANKS fbOpt
see HADES_FILTERBANKS
Definition saf_hades_internal.h:69

hades_analysis_data::W
float_complex * W
Diffuse integration weighting matrix; FLAT: nGrid x nGrid.
Definition saf_hades_internal.h:99

hades_analysis_data::H_array
float_complex * H_array
Array IRs in the frequency domain; FLAT: nBands x nMics x nDirs.
Definition saf_hades_internal.h:91

hades_analysis_data::nBands
int nBands
Number of frequency bands.
Definition saf_hades_internal.h:86

hades_analysis_data::timeSlots
int timeSlots
Number of time slots.
Definition saf_hades_internal.h:87

hades_analysis_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:75

hades_binaural_config
Binaural configuration struct.
Definition saf_hades_synthesis.h:60

hades_binaural_config::nHRIR
int nHRIR
Number of HRIRs.
Definition saf_hades_synthesis.h:62

hades_binaural_config::hrir_fs
int hrir_fs
HRIR sample rate.
Definition saf_hades_synthesis.h:63

hades_binaural_config::lHRIR
int lHRIR
Length of HRIRs in samples.
Definition saf_hades_synthesis.h:61

hades_binaural_config::hrir_dirs_deg
float * hrir_dirs_deg
HRTF directions in [azimuth elevation] format, in degrees; FLAT: nHRIR x 2.
Definition saf_hades_synthesis.h:66

hades_binaural_config::hrirs
float * hrirs
Matrix of HRIR data; FLAT: nHRIR x NUM_EARS x lHRIR.
Definition saf_hades_synthesis.h:64

hades_param_container_data
Parameter container to store the data from an analyser for one blocksize of audio.
Definition saf_hades_internal.h:169

hades_param_container_data::gains_idx
int * gains_idx
Reproduction direction index per band; nBands x 1.
Definition saf_hades_internal.h:175

hades_param_container_data::doa_idx
int * doa_idx
Beamforming direction index per band; nBands x 1.
Definition saf_hades_internal.h:174

hades_param_container_data::diffuseness
float * diffuseness
Diffuseness value per band; nBands x 1.
Definition saf_hades_internal.h:173

hades_param_container_data::gains_diff
float * gains_diff
Extra diffuse reproduction gain per band (default=1.0f); nBands x 1
Definition saf_hades_internal.h:179

hades_param_container_data::gains_dir
float * gains_dir
Extra direct reproduction gain per band (default=1.0f); nBands x 1
Definition saf_hades_internal.h:178

hades_radial_editor_data
Main structure for hades radial (360-degree) gain and direct-to-diffuse ratio editor.
Definition saf_hades_internal.h:184

hades_radial_editor_data::pGrid_dirs_deg
float * pGrid_dirs_deg
Pointer to grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:187

hades_radial_editor_data::pGrid_dirs_xyz
float * pGrid_dirs_xyz
Pointer to grid dirs as Cartesian coordinates of unit length; FLAT: nGrid x 3.
Definition saf_hades_internal.h:188

hades_radial_editor_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:186

hades_radial_editor_data::nBands
int nBands
Number of bands.
Definition saf_hades_internal.h:185

hades_signal_container_data
Signal container to store one block of TF-domain audio data.
Definition saf_hades_internal.h:193

hades_signal_container_data::Cx
CxMic * Cx
NON-time-averaged covariance matrix per band; nBands x .Cx(nMics x nMics)
Definition saf_hades_internal.h:199

hades_signal_container_data::inTF
float_complex *** inTF
Input frame in TF-domain; nBands x nMics x timeSlots.
Definition saf_hades_internal.h:202

hades_synthesis_data
Main structure for hades synthesis.
Definition saf_hades_internal.h:112

hades_synthesis_data::outTD
float ** outTD
output time-domain buffer; NUM_EARS x blocksize
Definition saf_hades_internal.h:164

hades_synthesis_data::hLinSolve
void * hLinSolve
Handle for solving linear equations (Ax=b)
Definition saf_hades_internal.h:150

hades_synthesis_data::blocksize
int blocksize
blocksize in samples
Definition saf_hades_internal.h:129

hades_synthesis_data::hCDF
void * hCDF
Handle for solving the covariance matching problem.
Definition saf_hades_internal.h:151

hades_synthesis_data::M
float_complex ** M
Mixing matrix per band; nBands x FLAT: (NUM_EARS x nMics)
Definition saf_hades_internal.h:160

hades_synthesis_data::synAvgCoeff
float synAvgCoeff
Mixing matrix averaging coefficient [0..1].
Definition saf_hades_internal.h:123

hades_synthesis_data::fbOpt
HADES_FILTERBANKS fbOpt
Filterbank option, see HADES_FILTERBANKS.
Definition saf_hades_internal.h:126

hades_synthesis_data::new_M
float_complex * new_M
New mixing matrix (not yet temporally averaged); FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:159

hades_synthesis_data::nBands
int nBands
Number of bands in the time-frequency transform domain.
Definition saf_hades_internal.h:127

hades_synthesis_data::H_array
float_complex * H_array
Array IRs in the frequency domain; FLAT: nBands x nMics x nGrid.
Definition saf_hades_internal.h:132

hades_synthesis_data::As
float_complex * As
Array steering vector for DoA; FLAT: nMics x 1.
Definition saf_hades_internal.h:152

hades_synthesis_data::eq
float * eq
Gain factor per band; nBands x 1.
Definition saf_hades_internal.h:121

hades_synthesis_data::timeSlots
int timeSlots
Number of time frames in the time-frequency transform domain.
Definition saf_hades_internal.h:135

hades_synthesis_data::H_bin
float_complex * H_bin
To spatialise the source beamformers; FLAT: nBands x NUM_EARS x nGrid.
Definition saf_hades_internal.h:144

hades_synthesis_data::beamOption
HADES_BEAMFORMER_TYPE beamOption
see HADES_BEAMFORMER_TYPE
Definition saf_hades_internal.h:114

hades_synthesis_data::enableCM
int enableCM
Flag: whether the spatial covariance matching is enabled (1) or disabled (0)
Definition saf_hades_internal.h:115

hades_synthesis_data::binConfig
hades_binaural_config * binConfig
Internal copy of user configuration.
Definition saf_hades_internal.h:116

hades_synthesis_data::freqVector
float * freqVector
Frequency vector (band centre frequencies); nBands x 1.
Definition saf_hades_internal.h:136

hades_synthesis_data::grid_dirs_deg
float * grid_dirs_deg
Array grid dirs in degrees; FLAT: nGrid x 2.
Definition saf_hades_internal.h:133

hades_synthesis_data::nGrid
int nGrid
Number of grid/scanning directions.
Definition saf_hades_internal.h:130

hades_synthesis_data::Q
float_complex * Q
Mixing matrix for the direct and diffuse streams combined (based on the diffuseness value); FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:157

hades_synthesis_data::As_r
float_complex * As_r
Array steering vector relative to right reference sensor; FLAT: nMics x 1.
Definition saf_hades_internal.h:154

hades_synthesis_data::diffEQ
float * diffEQ
EQ curve to bring the overall diffuse-field magnitude response of the array to that of the HRTFs inst...
Definition saf_hades_internal.h:146

hades_synthesis_data::hPinv
void * hPinv
Handle for computing the Moore-Penrose pseudo inverse.
Definition saf_hades_internal.h:149

hades_synthesis_data::DCM_array
float_complex * DCM_array
Diffuse coherence matrix for the array; FLAT: nBands x nMics x nMics.
Definition saf_hades_internal.h:137

hades_synthesis_data::hopsize
int hopsize
hopsize in samples
Definition saf_hades_internal.h:128

hades_synthesis_data::Cy
float_complex * Cy
Target binaural spatial covariance matrix; FLAT: NUM_EARS x NUM_EARS.
Definition saf_hades_internal.h:158

hades_synthesis_data::outTF
float_complex *** outTF
nBands x NUM_EARS x timeSlots
Definition saf_hades_internal.h:163

hades_synthesis_data::grid_dirs_xyz
float ** grid_dirs_xyz
Grid dirs as Cartesian coordinates of unit length; nGrid x 3.
Definition saf_hades_internal.h:134

hades_synthesis_data::Q_dir
float_complex * Q_dir
Mixing matrix for the direct stream; FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:156

hades_synthesis_data::DCM_bin_norm
float_complex * DCM_bin_norm
Diffuse coherence matrix for the HRTF set, normalised with 1/trace(DCM_bin); FLAT: nBands x nMics x n...
Definition saf_hades_internal.h:145

hades_synthesis_data::W
float_complex * W
Diffuse integration weighting matrix; FLAT: nGrid x nGrid.
Definition saf_hades_internal.h:138

hades_synthesis_data::Q_diff
float_complex * Q_diff
Mixing matrix for the diffuse stream; FLAT: NUM_EARS x nMics.
Definition saf_hades_internal.h:155

hades_synthesis_data::interpOption
HADES_HRTF_INTERP_OPTIONS interpOption
HRIR interpolation option, see HADES_HRTF_INTERP_OPTIONS.
Definition saf_hades_internal.h:118

hades_synthesis_data::As_l
float_complex * As_l
Array steering vector relative to left reference sensor; FLAT: nMics x 1.
Definition saf_hades_internal.h:153

hades_synthesis_data::refIndices
int refIndices[2]
Indices into [0 nMics-1], defining the reference sensors.
Definition saf_hades_internal.h:117

hades_synthesis_data::hFB_dec
void * hFB_dec
Filterbank handle.
Definition saf_hades_internal.h:141

hades_synthesis_data::nMics
int nMics
Number of microphones.
Definition saf_hades_internal.h:131

hades_synthesis_data::streamBalance
float * streamBalance
Stream balance per band (0:fully diffuse, 1:balanced, 2:fully direct); nBands x 1.
Definition saf_hades_internal.h:122