% Tsur and Rappoport, "What's in a hashtag?" -- conference paper in the
% WSDM 2012 proceedings (5th ACM International Conference on Web Search
% and Data Mining).
%
% The citation key (apparently an exporter-generated id) is kept as-is so
% that existing citations of this entry keep resolving.
% year/month/day record 15 March 2012; the conference dates themselves
% (8--12 February 2012) are carried in `note`.
% The proceedings title lives in `booktitle` only, so styles print it once.
% NOTE(review): `day`, `language`, `keywords` and `abstract` are not standard
% BibTeX fields; classic styles are expected to ignore them -- confirm
% against the style in use.
@inproceedings{811708f1dc3a4f958ef97a446e991746,
  author    = {Tsur, Oren and Rappoport, Ari},
  title     = {What's in a hashtag? {Content} based prediction of the spread of ideas in microblogging communities},
  booktitle = {{WSDM} 2012 - Proceedings of the 5th {ACM} International Conference on Web Search and Data Mining},
  pages     = {643--652},
  year      = {2012},
  month     = mar,
  day       = {15},
  doi       = {10.1145/2124295.2124320},
  isbn      = {9781450307475},
  language  = {English},
  keywords  = {Hashtags, Information diffusion, Microblogging, Social media, Twitter},
  note      = {5th ACM International Conference on Web Search and Data Mining, WSDM 2012 ; Conference date: 08-02-2012 Through 12-02-2012},
  abstract  = {Current social media research mainly focuses on temporal trends of the information flow and on the topology of the social graph that facilitates the propagation of information. In this paper we study the effect of the content of the idea on the information propagation. We present an efficient hybrid approach based on a linear regression for predicting the spread of an idea in a given time frame. We show that a combination of content features with temporal and topological features minimizes prediction error. Our algorithm is evaluated on Twitter hashtags extracted from a dataset of more than 400 million tweets. We analyze the contribution and the limitations of the various feature types to the spread of information, demonstrating that content aspects can be used as strong predictors thus should not be disregarded. We also study the dependencies between global features such as graph topology and content features.},
}