% Conference paper by Gonen and Gudes in the SwSTE 2016 proceedings.
% Case-sensitive words in title/booktitle are brace-protected so that
% sentence-casing styles keep them intact. The former "series" field was an
% exact copy of "booktitle" and has been dropped to avoid printing the
% proceedings title twice.
% NOTE(review): "address" holds a country, not the publisher's city; confirm
% the intended publisher location before relying on it.
@inproceedings{e2ce75c04a8a4d1e8ee64cacbe2729b2,
  author    = {Gonen, Yaron and Gudes, Ehud},
  title     = {An Improved {MapReduce} Algorithm for Mining Closed Frequent Itemsets},
  booktitle = {Proceedings - 2016 {IEEE} International Conference on Software Science, Technology and Engineering, {SwSTE} 2016},
  publisher = {Institute of Electrical and Electronics Engineers},
  address   = {United States},
  pages     = {77--83},
  year      = {2016},
  month     = jul,
  day       = {18},
  doi       = {10.1109/SWSTE.2016.19},
  language  = {English},
  keywords  = {closed itemsets, data mining, frequent itemsets},
  abstract  = {Mining closed frequent item sets is a key objective in the field of data mining due to its wide range of applications. Given a database of transactions, the task is to find closed subsets which appear frequently in different transactions. This subject has been studied thoroughly, and many efficient algorithms had been presented, however, most of them were designed for a non-distributed setting. The exponential growth of data in current times forces storing it in a distributed setting, meaning that most algorithms no longer apply. MapReduce is an acclaimed programming paradigm for processing large-scale, distributed data. In this paper we present an efficient algorithm for mining closed frequent item sets using the MapReduce paradigm. In addition to its novelty of running in a distributed setting, it also makes the duplication elimination step - a common step to all existing algorithms - redundant.},
  note      = {Publisher Copyright: {\textcopyright} 2016 IEEE.; 2016 IEEE International Conference on Software Science, Technology and Engineering, SwSTE 2016 ; Conference date: 23-06-2016 Through 24-06-2016},
}