Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method, which limits the influence of spam in social bookmarking analysis and provide conclusions and directions for future research.
%0 Conference Paper
%1 wetzker2008analyzing
%A Wetzker, Robert
%A Zimmermann, Carsten
%A Bauckhage, Christian
%B Mining Social Data (MSoDa) Workshop Proceedings
%D 2008
%K folksonomy tagging
%P 26-30
%T Analyzing Social Bookmarking Systems: A del.icio.us Cookbook
%U http://robertwetzker.com/wp-content/uploads/2008/06/wetzker_delicious_ecai2008_final.pdf
%X Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method, which limits the influence of spam in social bookmarking analysis and provide conclusions and directions for future research.
@comment{
  Workshop paper by Wetzker, Zimmermann and Bauckhage (2008).
  The added-at, biburl, interhash, intrahash and timestamp fields are
  bookkeeping fields carried over from the export; standard styles ignore
  unknown fields. The month is given as the unquoted macro jul and the page
  range uses a double hyphen so that styles can format both.
}
@inproceedings{wetzker2008analyzing,
  abstract     = {Social bookmarking systems have recently gained interest among researchers in the areas of data mining and web intelligence, as they provide a vast amount of user-generated annotations and reflect the interests of millions of people. In this paper, we discuss our initial findings obtained from analyzing a vast corpus of almost 150 million bookmarks found at del.icio.us. Apart from investigating bookmarking and tagging patterns in this data, we discuss evidence that social bookmarking systems are vulnerable to spamming and hence need to be preprocessed before any insightful analysis can be carried out. We present a method, which limits the influence of spam in social bookmarking analysis and provide conclusions and directions for future research.},
  added-at     = {2010-08-21T08:36:49.000+0200},
  author       = {Wetzker, Robert and Zimmermann, Carsten and Bauckhage, Christian},
  biburl       = {https://www.bibsonomy.org/bibtex/2c71aa17db3959585ed3320dcefe7f39b/deynard},
  booktitle    = {Mining Social Data (MSoDa) Workshop Proceedings},
  interhash    = {cdd8d32ba6507335a3b856419afc71c3},
  intrahash    = {c71aa17db3959585ed3320dcefe7f39b},
  keywords     = {folksonomy tagging},
  month        = jul,
  organization = {ECAI 2008},
  pages        = {26--30},
  timestamp    = {2010-08-21T08:36:50.000+0200},
  title        = {Analyzing Social Bookmarking Systems: A del.icio.us Cookbook},
  url          = {http://robertwetzker.com/wp-content/uploads/2008/06/wetzker_delicious_ecai2008_final.pdf},
  year         = 2008
}