This documentation page applies to an outdated AMT version (1.1.0). Click here for the most recent page.
function [x_feat] = llado2022_binauralfeats(ir_input,stim,fs)
%llado2022_binauralfeats calculates binaural features
% Usage: [x_feat] = llado2022_binauralfeats(ir_input,stim,fs);
%
% Input parameters:
% ir_input : Impulse response according to the following matrix
% dimensions: direction x time x channel/ear
% stim : stimulus
% fs : samplef frequency
%
% Output parameters:
% x_feat : binaural features according to the following matrix
% dimensions: nOutputs x features. Features combine the
% itd values below 1.5 kHz (rows 1-18) and ild values
% over 1 kHz (rows 19-36).
%
% Binaural auditory model based on the example 13.6.2 in: Ville Pulkki and
% Matti Karjalainen. Communication acoustics: an introduction to
% speech, audio and psychoacoustics. John Wiley & Sons, 2015.
%
% Url: http://amtoolbox.org/amt-1.1.0/doc/modelstages/llado2022_binauralfeats.php
% Copyright (C) 2009-2021 Piotr Majdak, Clara Hollomey, and the AMT team.
% This file is part of Auditory Modeling Toolbox (AMT) version 1.1.0
%
% This program is free software: you can redistribute it and/or modify
% it under the terms of the GNU General Public License as published by
% the Free Software Foundation, either version 3 of the License, or
% (at your option) any later version.
%
% This program is distributed in the hope that it will be useful,
% but WITHOUT ANY WARRANTY; without even the implied warranty of
% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
% GNU General Public License for more details.
%
% You should have received a copy of the GNU General Public License
% along with this program. If not, see <http://www.gnu.org/licenses/>.
if(ndims(ir_input) == 3)
nIRs = length(ir_input(:,1,1));
ir = ir_input;
else
if(ismatrix(ir_input) == 1)
nIRs = 1;
ir(1,:,:) = ir_input;
else
disp("Wrong input");
end
end
%% USING AMTOOLBOX FOR GAMMA TONE MODEL %%%%%
%create of a gammatone filter bank using the AMT function
%(http://amtoolbox.sourceforge.net)
%
for n_ir = 1:nIRs
%convolution: stimulus - hrirs
insig = [conv(stim,ir(n_ir,:,1)) conv(stim,ir(n_ir,:,2))];
%some parameters for auditory model
fLow = 50;%the lowest characteristic frequency of the filter bank
fHigh = 8000;%and the highest
fCut = 1000; % cut-off frequency of the low-pass filter
maxLag= floor(0.00067*fs); % IACC-values are computed within-1...1 ms
%FILTERS CHARACTERISTIC FREQUENCIES
cfs = erbspacebw(fLow,fHigh); %charact. frequencies of the filter bank
[b,a] = gammatone(cfs,fs,'complex');
%'complex' Generate filter modulated by exponential functions
% b,a: nominator,denominator coefficients
%% Windowing init
% Determine length of input signal
nSamples = size(insig,1);
% Block parameter
blockSec = 20e-3; % Block size in seconds
hopSec = 10e-3; % Step size in seconds
% Block processing parameters
blockSamples = 2 * round(fs * blockSec / 2);
hopSamples = 2 * round(fs * hopSec / 2);
overSamples = blockSamples - hopSamples;
%Haning Window
w = hann(blockSamples);
% Calculate number of frames
nFrames = fix((nSamples-overSamples)/hopSamples);
for i = 1 : nFrames
%GENERATING FILTERS (UFILTERBANKZ) AND FILTERING THE INDIVIDUAL SIGNALS
%processing the signal through the filter bank
filterOut(i).left=2*real(ufilterbankz(b,a,insig((i-1)*hopSamples+1:...
(i-1)*hopSamples+blockSamples,1)));
filterOut(i).right=2*real(ufilterbankz(b,a,insig((i-1)*hopSamples+1:...
(i-1)*hopSamples+blockSamples,2)));
%%%%%EMULATION OF THE NEURAL TRANSDUCTION with :
% 1) half-wave rectification and
rectified(i).left = filterOut(i).left.*(filterOut(i).left>0);
rectified(i).right = filterOut(i).right.*(filterOut(i).right>0);
% 2) low-pass filtering of the filter bank output
%a first-order IIR filter is used as the low-pass filter
beta = exp(-fCut/fs);
outSig(i).left = filter(1-beta,[1 -beta],rectified(i).left);
outSig(i).right = filter(1-beta,[1 -beta],rectified(i).right);
%%%%%COMPUTE INTERAURAL CROSS-CORRELATION AT EACH FREQ BAND
iaccFuncts = zeros(2*maxLag+1,length(cfs));
lagValues = (-maxLag:maxLag)./fs;% vector of lags at fs from min to max
for freqInd=1:length(cfs)
iaccFuncts(:,freqInd) = xcorr(outSig(i).left(:,freqInd),...
outSig(i).right(:,freqInd),maxLag,'coeff'); %COEFF:
%Normalizes the sequence so that the
%autocorrelations at zero lag equal 1
end
%%%%%COMPUTE ITD FOR EACH FREQ BAND
[~,lag] = max(iaccFuncts);
itdEst(i,:) = lagValues(lag); % Time corresponding to lag displacement
%%%%%COMPUTE ILD FOR EACH FREQ BAND
ildEst(i,:) = dbspl(outSig(i).right(:,:))-dbspl(outSig(i).left(:,:));
%% Store binaural faetures for the next stage of the model
end
itdild_feat(n_ir,4:35) = mean(itdEst(:,1:end));
itdild_feat(n_ir,36:67) = mean(ildEst(:,1:end));
%%%%%
end
x_feat = [itdild_feat(:,4:21)';itdild_feat(:,50:end)']; % Use ITD below 1.5 kHz and ILD over 1 kHz
end