Gaussian Power flow Orientation Coefficients for noise-robust speech recognition. Gerazov, B. & Ivanovski, Z. In 2014 22nd European Signal Processing Conference (EUSIPCO), pages 1467-1471, Sep., 2014. Paper abstract bibtex Spectro-temporal features have shown a great promise in respect to improving the noise-robustness of Automatic Speech Recognition (ASR) systems. The common approach uses a bank of 2D Gabor filters to process the speech signal spectrogram and generate the output feature vector. This approach suffers from generating a large number of coefficients, thus necessitating the use of feature dimensionality reduction. The proposed Gaussian Power flow Orientation Coefficients (GPOCs) use an alternative approach in which only the largest coefficients output from a bank of 2D Gaussian kernels are used to describe the spectro-temporal patterns of power flow in the auditory spectrogram. Whilst reducing the size of the feature vectors, the algorithm was shown to outperform traditional feature extraction methods, even a reference spectro-temporal approach, for low SNRs. Its performance for high SNRs is comparable but inferior to traditional ASR frontends, while falling behind state-of-the-art algorithms in all noise scenarios.
@InProceedings{6952533,
author = {B. Gerazov and Z. Ivanovski},
booktitle = {2014 22nd European Signal Processing Conference (EUSIPCO)},
title = {Gaussian Power flow Orientation Coefficients for noise-robust speech recognition},
year = {2014},
pages = {1467-1471},
abstract = {Spectro-temporal features have shown a great promise in respect to improving the noise-robustness of Automatic Speech Recognition (ASR) systems. The common approach uses a bank of 2D Gabor filters to process the speech signal spectrogram and generate the output feature vector. This approach suffers from generating a large number of coefficients, thus necessitating the use of feature dimensionality reduction. The proposed Gaussian Power flow Orientation Coefficients (GPOCs) use an alternative approach in which only the largest coefficients output from a bank of 2D Gaussian kernels are used to describe the spectro-temporal patterns of power flow in the auditory spectrogram. Whilst reducing the size of the feature vectors, the algorithm was shown to outperform traditional feature extraction methods, even a reference spectro-temporal approach, for low SNRs. Its performance for high SNRs is comparable but inferior to traditional ASR frontends, while falling behind state-of-the-art algorithms in all noise scenarios.},
keywords = {channel bank filters;feature extraction;Gabor filters;Gaussian processes;speech recognition;Gaussian power flow orientation coefficients;noise-robust speech recognition;spectro-temporal features;automatic speech recognition systems;ASR system;2D Gabor filter bank;speech signal spectrogram processing;output feature vector generation;feature dimensionality reduction;GPOCs;2D Gaussian kernel bank;auditory spectrogram;feature vector size reduction;feature extraction methods;reference spectro-temporal approach;SNRs;ASR frontends;Spectrogram;Kernel;Feature extraction;Load flow;Speech;Training;Gabor filters;ASR;noise-robust;spectro-temporal;2D Gaussian;kernel},
issn = {2076-1465},
month = {Sep.},
url = {https://www.eurasip.org/proceedings/eusipco/eusipco2014/html/papers/1569921711.pdf},
}
Downloads: 0
{"_id":"LrbgG5aP3cH8v5JAd","bibbaseid":"gerazov-ivanovski-gaussianpowerfloworientationcoefficientsfornoiserobustspeechrecognition-2014","authorIDs":[],"author_short":["Gerazov, B.","Ivanovski, Z."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["B."],"propositions":[],"lastnames":["Gerazov"],"suffixes":[]},{"firstnames":["Z."],"propositions":[],"lastnames":["Ivanovski"],"suffixes":[]}],"booktitle":"2014 22nd European Signal Processing Conference (EUSIPCO)","title":"Gaussian Power flow Orientation Coefficients for noise-robust speech recognition","year":"2014","pages":"1467-1471","abstract":"Spectro-temporal features have shown a great promise in respect to improving the noise-robustness of Automatic Speech Recognition (ASR) systems. The common approach uses a bank of 2D Gabor filters to process the speech signal spectrogram and generate the output feature vector. This approach suffers from generating a large number of coefficients, thus necessitating the use of feature dimensionality reduction. The proposed Gaussian Power flow Orientation Coefficients (GPOCs) use an alternative approach in which only the largest coefficients output from a bank of 2D Gaussian kernels are used to describe the spectro-temporal patterns of power flow in the auditory spectrogram. Whilst reducing the size of the feature vectors, the algorithm was shown to outperform traditional feature extraction methods, even a reference spectro-temporal approach, for low SNRs. Its performance for high SNRs is comparable but inferior to traditional ASR frontends, while falling behind state-of-the-art algorithms in all noise scenarios.","keywords":"channel bank filters;feature extraction;Gabor filters;Gaussian processes;speech recognition;Gaussian power flow orientation coefficients;noise-robust speech recognition;spectro-temporal features;automatic speech recognition systems;ASR system;2D Gabor filter bank;speech signal spectrogram processing;output feature vector generation;feature dimensionality reduction;GPOCs;2D Gaussian kernel bank;auditory spectrogram;feature vector size reduction;feature extraction methods;reference spectro-temporal approach;SNRs;ASR frontends;Spectrogram;Kernel;Feature extraction;Load flow;Speech;Training;Gabor filters;ASR;noise-robust;spectro-temporal;2D Gaussian;kernel","issn":"2076-1465","month":"Sep.","url":"https://www.eurasip.org/proceedings/eusipco/eusipco2014/html/papers/1569921711.pdf","bibtex":"@InProceedings{6952533,\n author = {B. Gerazov and Z. Ivanovski},\n booktitle = {2014 22nd European Signal Processing Conference (EUSIPCO)},\n title = {Gaussian Power flow Orientation Coefficients for noise-robust speech recognition},\n year = {2014},\n pages = {1467-1471},\n abstract = {Spectro-temporal features have shown a great promise in respect to improving the noise-robustness of Automatic Speech Recognition (ASR) systems. The common approach uses a bank of 2D Gabor filters to process the speech signal spectrogram and generate the output feature vector. This approach suffers from generating a large number of coefficients, thus necessitating the use of feature dimensionality reduction. The proposed Gaussian Power flow Orientation Coefficients (GPOCs) use an alternative approach in which only the largest coefficients output from a bank of 2D Gaussian kernels are used to describe the spectro-temporal patterns of power flow in the auditory spectrogram. Whilst reducing the size of the feature vectors, the algorithm was shown to outperform traditional feature extraction methods, even a reference spectro-temporal approach, for low SNRs. Its performance for high SNRs is comparable but inferior to traditional ASR frontends, while falling behind state-of-the-art algorithms in all noise scenarios.},\n keywords = {channel bank filters;feature extraction;Gabor filters;Gaussian processes;speech recognition;Gaussian power flow orientation coefficients;noise-robust speech recognition;spectro-temporal features;automatic speech recognition systems;ASR system;2D Gabor filter bank;speech signal spectrogram processing;output feature vector generation;feature dimensionality reduction;GPOCs;2D Gaussian kernel bank;auditory spectrogram;feature vector size reduction;feature extraction methods;reference spectro-temporal approach;SNRs;ASR frontends;Spectrogram;Kernel;Feature extraction;Load flow;Speech;Training;Gabor filters;ASR;noise-robust;spectro-temporal;2D Gaussian;kernel},\n issn = {2076-1465},\n month = {Sep.},\n url = {https://www.eurasip.org/proceedings/eusipco/eusipco2014/html/papers/1569921711.pdf},\n}\n\n","author_short":["Gerazov, B.","Ivanovski, Z."],"key":"6952533","id":"6952533","bibbaseid":"gerazov-ivanovski-gaussianpowerfloworientationcoefficientsfornoiserobustspeechrecognition-2014","role":"author","urls":{"Paper":"https://www.eurasip.org/proceedings/eusipco/eusipco2014/html/papers/1569921711.pdf"},"keyword":["channel bank filters;feature extraction;Gabor filters;Gaussian processes;speech recognition;Gaussian power flow orientation coefficients;noise-robust speech recognition;spectro-temporal features;automatic speech recognition systems;ASR system;2D Gabor filter bank;speech signal spectrogram processing;output feature vector generation;feature dimensionality reduction;GPOCs;2D Gaussian kernel bank;auditory spectrogram;feature vector size reduction;feature extraction methods;reference spectro-temporal approach;SNRs;ASR frontends;Spectrogram;Kernel;Feature extraction;Load flow;Speech;Training;Gabor filters;ASR;noise-robust;spectro-temporal;2D Gaussian;kernel"],"metadata":{"authorlinks":{}},"downloads":0},"bibtype":"inproceedings","biburl":"https://raw.githubusercontent.com/Roznn/EUSIPCO/main/eusipco2014url.bib","creationDate":"2021-02-13T17:43:41.694Z","downloads":0,"keywords":["channel bank filters;feature extraction;gabor filters;gaussian processes;speech recognition;gaussian power flow orientation coefficients;noise-robust speech recognition;spectro-temporal features;automatic speech recognition systems;asr system;2d gabor filter bank;speech signal spectrogram processing;output feature vector generation;feature dimensionality reduction;gpocs;2d gaussian kernel bank;auditory spectrogram;feature vector size reduction;feature extraction methods;reference spectro-temporal approach;snrs;asr frontends;spectrogram;kernel;feature extraction;load flow;speech;training;gabor filters;asr;noise-robust;spectro-temporal;2d gaussian;kernel"],"search_terms":["gaussian","power","flow","orientation","coefficients","noise","robust","speech","recognition","gerazov","ivanovski"],"title":"Gaussian Power flow Orientation Coefficients for noise-robust speech recognition","year":2014,"dataSources":["A2ezyFL6GG6na7bbs","oZFG3eQZPXnykPgnE"]}