% Conference paper from the IEEEI 2014 proceedings (speaker diarization, HDM-based system).
% Free-text fields (title, abstract, keywords) are kept verbatim from the source record.
% NOTE(review): "address" holds a country rather than the publisher's city -- confirm and replace.
% NOTE(review): "month" follows the conference dates stated in the note field (3-5 Dec 2014);
%               verify against the publisher's page for the DOI if an exact issue date matters.
@inproceedings{6caf3ed53f69409693acafda433fa928,
  author    = {Furmanov, Tal and Aminov, Lidiya and Moyal, Ami and Lapidot, Itshak},
  title     = {Randomization effect on iterative-based speaker diarization system for telephone conversations},
  booktitle = {2014 {IEEE} 28th Convention of Electrical and Electronics Engineers in Israel, {IEEEI} 2014},
  publisher = {{Institute of Electrical and Electronics Engineers}},
  address   = {United States},
  year      = {2014},
  month     = dec,
  doi       = {10.1109/EEEI.2014.7005738},
  note      = {Conference date: 03-12-2014 Through 05-12-2014},
  language  = {English},
  keywords  = {Hidden-distortion model (HDM), Initialization, K-means, Self-organizing maps (SOM), Speaker diarization},
  abstract  = {The primary objective of speaker diarization system is to designate speech segments to one of K speakers in the conversation. We use a hidden-distortion-model (HDM)-based system. HDM allows using different emission models as speaker models. We investigate the effect of randomization in two different levels. One level is stochastic training versus deterministic training and the other, random model initialization versus preserving initialization from the previous iteration. The emission models were codebooks (CBs) trained using K-means algorithm, both, batch and stochastic versions, as well as a self-organizing map (SOM) in its stochastic version. The evaluation performed on 108 telephone conversations from the LDC CallHome corpus. We will show that randomizing is always outperforming the deterministic training. Stochastic training demonstrated relative improvement of 3.5\%. Random initialization achieved relative improvement of 7.28\% comparing to preservation of initialization from the previous iteration.},
  copyright = {Publisher Copyright: {\textcopyright} Copyright 2015 IEEE All rights reserved.},
}