% Bibliography: publications on tag semantics and social bookmarking.
%
% Conventions used in this file:
%   * Every citation key occurs exactly once.
%   * Three keys (tagging-cattuto, cattuto2008semantica, cattuto2008semantic)
%     describe the same ISWC 2008 paper (same DOI and interhash); two keys
%     (cattuto08-semantic, cattuto-2008) describe the same OLP3 paper and its
%     preprint. All are kept because documents may cite any of them.
%   * month uses the bare three-letter macros, page ranges use "--",
%     DOIs are stored without a resolver prefix.
%   * Non-ASCII letters in names are written as LaTeX escapes so the file
%     also works with classic 8-bit BibTeX.
%   * interhash, intrahash, citeulike-*, posted-at, priority, file, groups,
%     username and timestamp are tool-specific fields ignored by standard
%     styles; they are preserved verbatim.

% ISWC 2008 paper (incollection variant, CiteULike-style export).
@incollection{tagging-cattuto,
  author                = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title                 = {Semantic Grounding of Tag Relatedness in Social Bookmarking Systems},
  booktitle             = {The Semantic Web -- ISWC 2008},
  editor                = {Sheth, Amit and Staab, Steffen and Dean, Mike and Paolucci, Massimo and Maynard, Diana and Finin, Timothy and Thirunarayan, Krishnaprasad},
  series                = {Lecture Notes in Computer Science},
  volume                = {5318},
  pages                 = {615--631},
  publisher             = {Springer},
  address               = {Berlin/Heidelberg},
  year                  = {2008},
  doi                   = {10.1007/978-3-540-88564-1_39},
  url                   = {http://tagora-project.eu/wp-content/2009/09/cattuto_iswc2008.pdf},
  abstract              = {Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.},
  citeulike-article-id  = {4718854},
  citeulike-linkout-0   = {http://dx.doi.org/10.1007/978-3-540-88564-1\_39},
  citeulike-linkout-1   = {http://www.springerlink.com/content/9044260283881v78},
  interhash             = {b44538648cfd476d6c94e30bc6626c86},
  intrahash             = {022ccb7184fcd0e43092fca13fd56a00},
  posted-at             = {2011-09-09 20:06:23},
  priority              = {2},
}

@inproceedings{atzmueller2011towards,
  author    = {Atzmueller, Martin and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title     = {Towards Mining Semantic Maturity in Social Bookmarking Systems},
  booktitle = {Proceedings of the 4th international workshop on Social Data on the Web (SDoW2011)},
  editor    = {Passant, Alexandre and Fern{\'a}ndez, Sergio and Breslin, John and Boj{\=a}rs, Uldis},
  year      = {2011},
  url       = {http://www.kde.cs.uni-kassel.de/pub/pdf/atzmueller2011towards.pdf},
  interhash = {65222f0ccc23063a2a15c0a7fd5513a0},
  intrahash = {a47a41658592202811f0139d4bb65871},
}

% ISWC 2008 paper (variant filed under the LNAI series, with local PDF link).
@inproceedings{cattuto2008semantica,
  author    = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title     = {Semantic Grounding of Tag Relatedness in Social Bookmarking Systems},
  booktitle = {The Semantic Web -- ISWC 2008, Proc. Intl. Semantic Web Conference 2008},
  editor    = {Sheth, Amit P. and Staab, Steffen and Dean, Mike and Paolucci, Massimo and Maynard, Diana and Finin, Timothy W. and Thirunarayan, Krishnaprasad},
  series    = {LNAI},
  volume    = {5318},
  pages     = {615--631},
  publisher = {Springer},
  address   = {Heidelberg},
  year      = {2008},
  doi       = {10.1007/978-3-540-88564-1_39},
  url       = {http://www.kde.cs.uni-kassel.de/pub/pdf/cattuto2008semantica.pdf},
  abstract  = {Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.},
  file      = {cattuto2008semantica.pdf:cattuto2008semantica.pdf:PDF},
  groups    = {public},
  interhash = {b44538648cfd476d6c94e30bc6626c86},
  intrahash = {27198c985b3bdb6daab0f7e961b370a9},
  timestamp = {2009-09-14 19:12:46},
  username  = {dbenz},
}

% German-language article: nouns are brace-protected individually so that
% styles applying sentence casing do not lowercase them.
@article{hotho2010publikationsmanagement,
  author    = {Hotho, Andreas and Benz, Dominik and Eisterlehner, Folke and J{\"a}schke, Robert and Krause, Beate and Schmitz, Christoph and Stumme, Gerd},
  title     = {{Publikationsmanagement} mit {BibSonomy} -- ein {Social-Bookmarking-System} f{\"u}r {Wissenschaftler}},
  journal   = {HMD -- Praxis der Wirtschaftsinformatik},
  volume    = {271},
  pages     = {47--58},
  month     = feb,
  year      = {2010},
  issn      = {1436-3011},
  abstract  = {Kooperative Verschlagwortungs- bzw. Social-Bookmarking-Systeme wie Delicious, Mister Wong oder auch unser eigenes System BibSonomy erfreuen sich immer gr{\"o}{\ss}erer Beliebtheit und bilden einen zentralen Bestandteil des heutigen Web 2.0. In solchen Systemen erstellen Nutzer leichtgewichtige Begriffssysteme, sogenannte Folksonomies, die die Nutzerdaten strukturieren. Die einfache Bedienbarkeit, die Allgegenw{\"a}rtigkeit, die st{\"a}ndige Verf{\"u}gbarkeit, aber auch die M{\"o}glichkeit, Gleichgesinnte spontan in solchen Systemen zu entdecken oder sie schlicht als Informationsquelle zu nutzen, sind Gr{\"u}nde f{\"u}r ihren gegenw{\"a}rtigen Erfolg. Der Artikel f{\"u}hrt den Begriff Social Bookmarking ein und diskutiert zentrale Elemente (wie Browsing und Suche) am Beispiel von BibSonomy anhand typischer Arbeitsabl{\"a}ufe eines Wissenschaftlers. Wir beschreiben die Architektur von BibSonomy sowie Wege der Integration und Vernetzung von BibSonomy mit Content-Management-Systemen und Webauftritten. Der Artikel schlie{\ss}t mit Querbez{\"u}gen zu aktuellen Forschungsfragen im Bereich Social Bookmarking.},
  file      = {dpunkt Product page:http\://hmd.dpunkt.de/271/05.html:URL},
  interhash = {4555775b639fe1ec65a302a61ee6532c},
  intrahash = {250d83c41fb10b89c73f54bd7040bd6e},
}

% ISWC 2008 paper (variant with ISBN).
@inproceedings{cattuto2008semantic,
  author    = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title     = {Semantic Grounding of Tag Relatedness in Social Bookmarking Systems},
  booktitle = {The Semantic Web -- ISWC 2008},
  editor    = {Sheth, Amit P. and Staab, Steffen and Dean, Mike and Paolucci, Massimo and Maynard, Diana and Finin, Timothy W. and Thirunarayan, Krishnaprasad},
  series    = {Lecture Notes in Computer Science},
  volume    = {5318},
  pages     = {615--631},
  publisher = {Springer},
  address   = {Berlin/Heidelberg},
  year      = {2008},
  isbn      = {978-3-540-88563-4},
  doi       = {10.1007/978-3-540-88564-1_39},
  url       = {http://www.kde.cs.uni-kassel.de/pub/pdf/cattuto2008semantica.pdf},
  abstract  = {Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.},
  interhash = {b44538648cfd476d6c94e30bc6626c86},
  intrahash = {4752f261d03cead0c52565148a0ba1c9},
}

@inproceedings{koerner2010thinking,
  author    = {K{\"o}rner, Christian and Benz, Dominik and Strohmaier, Markus and Hotho, Andreas and Stumme, Gerd},
  title     = {Stop Thinking, start Tagging - Tag Semantics emerge from Collaborative Verbosity},
  booktitle = {Proceedings of the 19th International World Wide Web Conference (WWW 2010)},
  publisher = {ACM},
  address   = {Raleigh, NC, USA},
  month     = apr,
  year      = {2010},
  url       = {http://www.kde.cs.uni-kassel.de/benz/papers/2010/koerner2010thinking.pdf},
  abstract  = {Recent research provides evidence for the presence of emergent semantics in collaborative tagging systems. While several methods have been proposed, little is known about the factors that influence the evolution of semantic structures in these systems. A natural hypothesis is that the quality of the emergent semantics depends on the pragmatics of tagging: Users with certain usage patterns might contribute more to the resulting semantics than others. In this work, we propose several measures which enable a pragmatic differentiation of taggers by their degree of contribution to emerging semantic structures. We distinguish between categorizers, who typically use a small set of tags as a replacement for hierarchical classification schemes, and describers, who are annotating resources with a wealth of freely associated, descriptive keywords. To study our hypothesis, we apply semantic similarity measures to 64 different partitions of a real-world and large-scale folksonomy containing different ratios of categorizers and describers. Our results not only show that `verbose' taggers are most useful for the emergence of tag semantics, but also that a subset containing only 40\% of the most `verbose' taggers can produce results that match and even outperform the semantic precision obtained from the whole dataset. Moreover, the results suggest that there exists a causal link between the pragmatics of tagging and resulting emergent semantics. This work is relevant for designers and analysts of tagging systems interested (i) in fostering the semantic development of their platforms, (ii) in identifying users introducing ``semantic noise'', and (iii) in learning ontologies.},
  interhash = {5afe6e4ce8357d8ac9698060fb438468},
  intrahash = {45f8d8f2a8251a5e988c596a5ebb3f2d},
}

@inproceedings{eisterlehner2010visit,
  author    = {Mitzlaff, Folke and Benz, Dominik and Stumme, Gerd and Hotho, Andreas},
  title     = {Visit me, click me, be my friend: An analysis of evidence networks of user relationships in {Bibsonomy}},
  booktitle = {Proceedings of the 21st ACM conference on Hypertext and hypermedia},
  address   = {Toronto, Canada},
  year      = {2010},
  interhash = {5584c4c57fcd8eb4663df8b114bcf09c},
  intrahash = {a97c4f7e80dcb666450acf697002155e},
}

@inproceedings{benz2009characterizing,
  author    = {Benz, Dominik and Krause, Beate and Kumar, G. Praveen and Hotho, Andreas and Stumme, Gerd},
  title     = {Characterizing Semantic Relatedness of Search Query Terms},
  booktitle = {Proceedings of the 1st Workshop on Explorative Analytics of Information Networks (EIN2009)},
  address   = {Bled, Slovenia},
  month     = sep,
  year      = {2009},
  interhash = {de5e58b26200e44112d9791f39e7523d},
  intrahash = {b697a98a7340585594455ee2e81d238a},
}

% OLP3 workshop paper; cattuto-2008 below is the preprint record of the same work.
@inproceedings{cattuto08-semantic,
  author    = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title     = {Semantic Analysis of Tag Similarity Measures in Collaborative Tagging Systems},
  booktitle = {Proceedings of the 3rd Workshop on Ontology Learning and Population (OLP3)},
  address   = {Patras, Greece},
  month     = jul,
  year      = {2008},
  url       = {http://olp.dfki.de/olp3/},
  abstract  = {Social bookmarking systems allow users to organise collections of resources on the Web in a collaborative fashion. The increasing popularity of these systems as well as first insights into their emergent semantics have made them relevant to disciplines like knowledge extraction and ontology learning. The problem of devising methods to measure the semantic relatedness between tags and characterizing it semantically is still largely open. Here we analyze three measures of tag relatedness: tag co-occurrence, cosine similarity of co-occurrence distributions, and FolkRank, an adaptation of the PageRank algorithm to folksonomies. Each measure is computed on tags from a large-scale dataset crawled from the social bookmarking system del.icio.us. To provide a semantic grounding of our findings, a connection to WordNet (a semantic lexicon for the English language) is established by mapping tags into synonym sets of WordNet, and applying there well-known metrics of semantic similarity. Our results clearly expose different characteristics of the selected measures of relatedness, making them applicable to different subtasks of knowledge extraction such as synonym detection or discovery of concept hierarchies.},
  interhash = {cc62b733f6e0402db966d6dbf1b7711f},
  intrahash = {3b0aca61b24e4343bd80390614e3066e},
}

% number is braced so the leading zero of the seminar number is preserved.
@inproceedings{benz2008analyzing,
  author    = {Benz, Dominik and Grobelnik, Marko and Hotho, Andreas and J{\"a}schke, Robert and Mladenic, Dunja and Servedio, Vito D. P. and Sizov, Sergej and Szomszor, Martin},
  title     = {Analyzing Tag Semantics Across Collaborative Tagging Systems},
  booktitle = {Social Web Communities},
  editor    = {Alani, Harith and Staab, Steffen and Stumme, Gerd},
  series    = {Dagstuhl Seminar Proceedings},
  number    = {08391},
  publisher = {Schloss Dagstuhl - Leibniz-Zentrum fuer Informatik},
  address   = {Dagstuhl, Germany},
  month     = sep,
  year      = {2008},
  issn      = {1862-4405},
  url       = {http://drops.dagstuhl.de/opus/volltexte/2008/1785},
  abstract  = {The objective of our group was to exploit state-of-the-art Information Retrieval methods for finding associations and dependencies between tags, capturing and representing differences in tagging behavior and vocabulary of various folksonomies, with the overall aim to better understand the semantics of tags and the tagging process. Therefore we analyze the semantic content of tags in the Flickr and Delicious folksonomies. We find that: tag context similarity leads to meaningful results in Flickr, despite its narrow folksonomy character; the comparison of tags across Flickr and Delicious shows little semantic overlap, being tags in Flickr associated more to visual aspects rather than technological as it seems to be in Delicious; there are regions in the tag-tag space, provided with the cosine similarity metric, that are characterized by high density; the order of tags inside a post has a semantic relevance.},
  interhash = {d738d9d90c1c466ee0a73ac0cc3dc4c1},
  intrahash = {7ab57438aa5a68137e46dab8dadd4b2c},
}

% Preprint record; the eprint identifier is the one embedded in the url field.
@misc{cattuto-2008,
  author        = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title         = {Semantic Analysis of Tag Similarity Measures in Collaborative Tagging Systems},
  year          = {2008},
  eprint        = {0805.2045},
  archiveprefix = {arXiv},
  url           = {http://www.citebase.org/abstract?id=oai:arXiv.org:0805.2045},
  abstract      = {Social bookmarking systems allow users to organise collections of resources on the Web in a collaborative fashion. The increasing popularity of these systems as well as first insights into their emergent semantics have made them relevant to disciplines like knowledge extraction and ontology learning. The problem of devising methods to measure the semantic relatedness between tags and characterizing it semantically is still largely open. Here we analyze three measures of tag relatedness: tag co-occurrence, cosine similarity of co-occurrence distributions, and FolkRank, an adaptation of the PageRank algorithm to folksonomies. Each measure is computed on tags from a large-scale dataset crawled from the social bookmarking system del.icio.us. To provide a semantic grounding of our findings, a connection to WordNet (a semantic lexicon for the English language) is established by mapping tags into synonym sets of WordNet, and applying there well-known metrics of semantic similarity. Our results clearly expose different characteristics of the selected measures of relatedness, making them applicable to different subtasks of knowledge extraction such as synonym detection or discovery of concept hierarchies.},
  interhash     = {cc62b733f6e0402db966d6dbf1b7711f},
  intrahash     = {78fd64c3db55e6387ebdeb6c40054542},
}