@inproceedings{727d018e4a2d43db81c1ad0ca8482bee,
title = "Factor analysis based spatial correlation modeling for speaker verification",
abstract = "Gaussian mixture models (GMMs) are commonly used in text-independent speaker verification for modeling the spectral distribution of speech. Recent studies have shown the effectiveness of characterizing speaker information using the mean super-vector obtained by concatenating the mean vectors of the GMM. This paper proposes to use the spatial correlation captured by the covariance matrix of the mean super-vector for speaker verification. Factor analysis method is adopted to estimate the covariance of the super-vector. For measuring the similarity between speech utterances in terms of the spatial correlation, we propose two kernel metrics, namely, log-Euclidean inner product and Frobenius angle. For computational simplicity, we introduce an inner product classifier (IPC) with equivalent performance compared to the commonly used support vector machine (SVM). Experiments conducted on the 2006 NIST speaker recognition evaluation (SRE) dataset confirm the efficacy of the proposed factor analysis based spatial modeling technique.",
keywords = "Factor analysis, Frobenius angle, Inner product classifier, Log-Euclidean distance",
author = "Wang, {Er Yu} and Wu Guo and Dai, {Li Rong} and Lee, {Kong Aik} and Bin Ma and Li, {Hai Zhou}",
year = "2010",
month = jan,
doi = "10.1109/ISCSLP.2010.5684490",
language = "English",
isbn = "9781424462469",
series = "2010 7th International Symposium on Chinese Spoken Language Processing, ISCSLP 2010 - Proceedings",
pages = "166--170",
booktitle = "2010 7th International Symposium on Chinese Spoken Language Processing, ISCSLP 2010 - Proceedings",
note = "2010 7th International Symposium on Chinese Spoken Language Processing, ISCSLP 2010 ; Conference date: 29-11-2010 Through 03-12-2010",
}