Conference paper by Smith and Richman (2003) on purifying contaminated
training data for GMM-based speaker detection; pages 269--274 of the IASTED
Circuits, Signals, and Systems proceedings. The citation key is kept as
exported so existing \cite commands continue to resolve.

@inproceedings{083a677bfe854418b766b26766689f32,
  author    = {Smith, David C. and Richman, Dan},
  title     = {Improving speaker detection in multi-speaker utterances through automatic purification of training data},
  booktitle = {Proceedings of the {IASTED} International Conference on Circuits, Signals, and Systems},
  editor    = {Rashid, M. H.},
  pages     = {269--274},
  year      = {2003},
  isbn      = {0889863512},
  language  = {English},
  note      = {Conference date: 19-05-2003 Through 21-05-2003},
  keywords  = {Gaussian mixture models, ROC curves, Score normalization, Speaker detection, Speech processing, Training data purification},
  abstract  = {This article is concerned with automatic purification of data used in training statistical models for automatic speaker detection. It is assumed that the available data for training a model for detecting a particular speaker of interest (SOI) is contaminated by utterances from at least one other speaker. Our approach consists of three steps: (1) build a Gaussian mixture model (GMM) for the SOI, training on the contaminated training files; (2) score consecutive segments of these training files with this GMM; (3) build a new purified GMM from highest scoring segments. We apply our method to a set of SOIs from the Switch-Board I corpus (using summed conversation sides), and show that the purified GMMs are significantly more accurate than the contaminated GMMs for detecting the presence of the SOIs in test data known to contain multi-speaker utterances. This evaluation is text-independent, and no assumptions about the identity or relationship of the non-SOIs in the training and testing data are made.},
}