@inbook{bbbdb54c0d5147519d04314dec9dcb2e,
title = "Comparison of distance measures for graph-based clustering of documents",
abstract = "In this paper we describe work relating to clustering of document collections. We compare the conventional vector-model approach using cosine similarity and Euclidean distance to a novel method we have developed for clustering graph-based data with the standard k-means algorithm. The proposed method is evaluated using five different graph distance measures under three clustering performance indices. The experiments are performed on two separate document collections. The results show the graph-based approach performs as well as vector-based methods or even better when using normalized graph distance measures.",
author = "Adam Schenker and Mark Last and Horst Bunke and Abraham Kandel",
year = "2003",
month = jan,
day = "1",
doi = "10.1007/3-540-45028-9_18",
language = "English",
isbn = "354040452X",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "202--213",
editor = "Edwin Hancock and Mario Vento",
booktitle = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
address = "Germany",
}