Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks
like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.
%0 Conference Paper
%1 cattuto2008semantic
%A Cattuto, Ciro
%A Benz, Dominik
%A Hotho, Andreas
%A Stumme, Gerd
%B The Semantic Web -- ISWC 2008
%C Berlin/Heidelberg
%D 2008
%E Sheth, Amit P.
%E Staab, Steffen
%E Dean, Mike
%E Paolucci, Massimo
%E Maynard, Diana
%E Finin, Timothy W.
%E Thirunarayan, Krishnaprasad
%I Springer
%K evaluation master measures similarity toVerify wordnet
%P 615--631
%R 10.1007/978-3-540-88564-1_39
%T Semantic Grounding of Tag Relatedness in Social Bookmarking Systems
%U http://cxnets.googlepages.com/cattuto_iswc2008.pdf
%V 5318
%X Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks
like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.
%@ 978-3-540-88563-4
@inproceedings{cattuto2008semantic,
  abstract  = {Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.},
  added-at  = {2010-06-03T10:20:42.000+0200},
  address   = {Berlin/Heidelberg},
  author    = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  biburl    = {https://www.bibsonomy.org/bibtex/2466f25c93d5e9c13ca5689191ef711ee/ans},
  booktitle = {The Semantic Web -- {ISWC} 2008},
  doi       = {10.1007/978-3-540-88564-1_39},
  editor    = {Sheth, Amit P. and Staab, Steffen and Dean, Mike and Paolucci, Massimo and Maynard, Diana and Finin, Timothy W. and Thirunarayan, Krishnaprasad},
  interhash = {b44538648cfd476d6c94e30bc6626c86},
  intrahash = {466f25c93d5e9c13ca5689191ef711ee},
  isbn      = {978-3-540-88563-4},
  keywords  = {evaluation master measures similarity toVerify wordnet},
  pages     = {615--631},
  publisher = {Springer},
  series    = {Lecture Notes in Computer Science},
  timestamp = {2011-03-22T23:02:17.000+0100},
  title     = {Semantic Grounding of Tag Relatedness in Social Bookmarking Systems},
  url       = {http://cxnets.googlepages.com/cattuto_iswc2008.pdf},
  volume    = {5318},
  year      = {2008},
}