% Conference paper in the ISCSLP 2010 proceedings (exported record, cleaned up).
% The citation key is kept as exported so existing \cite commands keep working.
% The proceedings title is stored only in booktitle; the conference dates are in note.
@inproceedings{db9551822e57497babdd147cf0985cd3,
  author    = {Lin, Ting H. and Hsu, Chung Chien and Chi, Tai-Shih},
  title     = {Spectro-temporal smoothed auditory spectra for robust speaker identification},
  booktitle = {2010 7th International Symposium on Chinese Spoken Language Processing, {ISCSLP} 2010 - Proceedings},
  pages     = {313--317},
  year      = {2010},
  doi       = {10.1109/ISCSLP.2010.5684884},
  isbn      = {9781424462469},
  language  = {English},
  note      = {Conference date: 29 November--3 December 2010},
  keywords  = {Auditory feature, Gaussian mixture model, Speaker identification, Spectro-temporal modulation},
  abstract  = {The performance of conventional speaker identification systems is severely compromised by interference, such as additive or convolutional noises. High-level information of the speaker provides more robust cues for identifying speakers. This paper proposes an auditory-model based spectro-temporal modulation filtering (STMF) process to capture high-level information for robust speaker identification. Text-independent closed-set speaker identification simulations are conducted on TIMIT and GRID corpora to evaluate the robustness of Auditory Cepstral Coefficients (ACCs) after the STMF process. Simulation results show ACCs' substantial improvement over conventional MFCCs in all SNR conditions. The superior noise-suppression performance of STMF to newly developed Auditory-based Nonnegative Tensor Cepstral Coefficients (ANTCCs) is also demonstrated in low SNR conditions.},
}