% Conference paper by Cohen and Lapidot in the ICSEE 2018 proceedings.
% The citation key is kept unchanged so existing citations still resolve.
% NOTE(review): month/day (2 Jul) precede the conference dates stated in the
%   note field (12-14 Dec 2018) -- confirm against the publisher record.
% NOTE(review): address holds a country, not a publisher city -- confirm.
@inproceedings{e41c843df7be46e58d2c9a6a34bd5d05,
  author    = {Cohen, Yishai and Lapidot, Itshak},
  title     = {Speakers clustering with stochastic {VQ} and clustering quality estimator},
  booktitle = {2018 IEEE International Conference on the Science of Electrical Engineering in Israel, ICSEE 2018},
  publisher = {Institute of Electrical and Electronics Engineers},
  address   = {United States},
  year      = {2018},
  month     = jul,
  day       = {2},
  doi       = {10.1109/ICSEE.2018.8646099},
  language  = {English},
  keywords  = {clustering quality estimation, cosine metric, logistic regression, mean-shift, speaker clustering, vector quantization (VQ)},
  abstract  = {Short segments speaker clustering has significant importance both for diarization and applications such as short push-to-talk (PTT) segments clustering. In this paper we present a new way to cluster speech segments by applying a stochastic vector quantization (VQ) with a cosine metric together with a speaker clustering quality estimator based on logistic regression. The VQ is performed on codebooks of different sizes, and the choice of the best clustering result is estimated using logistic regression. The algorithm is tested on a large range of speakers, between 2 to 60. The results are compared to those of the mean-shift clustering method, which was already tested for this task several times. The results are a bit below those of the cosine similarity measure-based mean-shift clustering. The advantage is in the run-time which is approximately 10 times faster.},
  note      = {Publisher Copyright: {\textcopyright} 2018 IEEE.; 2018 IEEE International Conference on the Science of Electrical Engineering in Israel, ICSEE 2018 ; Conference date: 12-12-2018 Through 14-12-2018},
}