Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method that limits the influence of spam in social bookmarking analysis, and we provide conclusions and directions for future research.
%0 Conference Paper
%1 wetzker2008analyzing
%A Wetzker, Robert
%A Zimmermann, Carsten
%A Bauckhage, Christian
%B Proceedings of the ECAI 2008 Mining Social Data Workshop
%D 2008
%K analyzing bookmarking delicious mt social
%P 26-30
%T Analyzing Social Bookmarking Systems: A del.icio.us Cookbook
%X Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method that limits the influence of spam in social bookmarking analysis, and we provide conclusions and directions for future research.
@comment{
  Workshop paper entry (BibSonomy export; see the biburl field).
  booktitle carries only the proceedings name: the leading "In" is
  supplied by the bibliography style and the year lives in the year field.
  pages uses a double hyphen so the range is typeset as an en dash.
  Braced words in title/booktitle are protected from style recasing.
  added-at, biburl, interhash, intrahash and timestamp are BibSonomy
  bookkeeping fields, kept verbatim.
}
@inproceedings{wetzker2008analyzing,
  author    = {Wetzker, Robert and Zimmermann, Carsten and Bauckhage, Christian},
  title     = {Analyzing Social Bookmarking Systems: A {del.icio.us} Cookbook},
  booktitle = {Proceedings of the {ECAI} 2008 Mining Social Data Workshop},
  pages     = {26--30},
  year      = {2008},
  keywords  = {analyzing bookmarking delicious mt social},
  abstract  = {Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method that limits the influence of spam in social bookmarking analysis, and we provide conclusions and directions for future research.},
  added-at  = {2009-11-24T09:34:23.000+0100},
  biburl    = {https://www.bibsonomy.org/bibtex/23e7e46b40aa77f08c2d985ed49c4d60e/ghp09},
  interhash = {cdd8d32ba6507335a3b856419afc71c3},
  intrahash = {3e7e46b40aa77f08c2d985ed49c4d60e},
  timestamp = {2009-11-24T09:34:23.000+0100},
}