% Bibliography database: folksonomies, tag semantics and ontology learning.
%
% Conventions used in this file:
%   - one field per line, values brace-delimited, trailing comma after the last field;
%   - month uses the predefined three-letter macros (jan .. dec), unquoted;
%   - page ranges use a double hyphen (123--148);
%   - doi holds the bare DOI without any resolver prefix;
%   - words in titles that must keep their case are protected with braces.
%
% NOTE(review): interhash / intrahash / username / groups / file / timestamp look like
% export metadata from a reference manager; standard styles ignore them. They are kept
% verbatim -- confirm before removing.

@inproceedings{benz2010semantics,
  author = {Benz, Dominik and Hotho, Andreas and Stützer, Stefan and Stumme, Gerd},
  title = {Semantics made by you and me: Self-emerging ontologies can capture the diversity of shared knowledge},
  booktitle = {Proceedings of the 2nd Web Science Conference (WebSci10)},
  address = {Raleigh, NC, USA},
  year = 2010,
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/benz2010semantics.pdf},
  file = {benz2010semantics.pdf:benz2010semantics.pdf:PDF},
  interhash = {d4a2f14bb27ce220ba43f651e42aeddc},
  intrahash = {16c77e486fb8bc527eb7734b153932ab},
}

@inproceedings{bade2008evaluation,
  author = {Bade, Korinna and Benz, Dominik},
  title = {Evaluation Strategies for Learning Algorithms of Hierarchical Structures},
  booktitle = {Proceedings of the 32nd Annual Conference of the German Classification Society - Advances in Data Analysis, Data Handling and Business Intelligence (GfKl 2008)},
  series = {Studies in Classification, Data Analysis, and Knowledge Organization},
  publisher = {Springer},
  address = {Berlin-Heidelberg},
  year = 2008,
  note = {in press},
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/bade2008evaluation.pdf},
  abstract = {Several learning tasks comprise hierarchies. Comparison with a ``goldstandard'' is often performed to evaluate the quality of a learned hierarchy. We assembled various similarity metrics that have been proposed in different disciplines and compared them in a unified interdisciplinary framework for hierarchical evaluation which is based on the distinction of three fundamental dimensions. Identifying deficiencies for measuring structural similarity, we suggest three new measures for this purpose, either extending existing ones or based on new ideas. Experiments with an artificial dataset were performed to compare the different measures. As shown by our results, the measures vary greatly in their properties.},
  file = {bade2008evaluation.pdf:bade2008evaluation.pdf:PDF},
  groups = {public},
  interhash = {8bb09e3197d01f7c23481c2cd68533af},
  intrahash = {ec033805bc90ab87c99860e29f0d00dd},
  username = {dbenz},
}

@inproceedings{benz2007position,
  author = {Benz, Dominik and Hotho, Andreas},
  title = {Position Paper: Ontology Learning from Folksonomies},
  booktitle = {Workshop Proceedings of Lernen - Wissensentdeckung - Adaptivität (LWA 2007)},
  editor = {Hinneburg, Alexander},
  pages = {109--112},
  publisher = {Martin-Luther-Universität Halle-Wittenberg},
  month = sep,
  year = 2007,
  isbn = {978-3-86010-907-6},
  note = {http://lwa07.informatik.uni-halle.de/kdml07/kdml07.htm},
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/benz2007position.pdf},
  abstract = {The emergence of collaborative tagging systems with their underlying flat and uncontrolled resource organization paradigm has led to a large number of research activities focussing on a formal description and analysis of the resulting “folksonomies”. An interesting outcome is that the characteristic qualities of these systems seem to be inverse to more traditional knowledge structuring approaches like taxonomies or ontologies: The latter provide rich and precise semantics, but suffer - amongst others - from a knowledge acquisition bottleneck. An important step towards exploiting the possible synergies by bridging the gap between both paradigms is the automatic extraction of relations between tags in a folksonomy. This position paper presents preliminary results of ongoing work to induce hierarchical relationships among tags by analyzing the aggregated data of collaborative tagging systems as a basis for an ontology learning procedure.},
  file = {benz2007position.pdf:benz2007position.pdf:PDF},
  groups = {public},
  interhash = {ff7de5717f771dabd764675279ff3adf},
  intrahash = {72bff5ebe5dfb5023f62ba9b94e6ed01},
  username = {dbenz},
}

@inproceedings{benz2008analyzing,
  author = {Benz, Dominik and Grobelnik, Marko and Hotho, Andreas and Jäschke, Robert and Mladenic, Dunja and Servedio, Vito D. P. and Sizov, Sergej and Szomszor, Martin},
  title = {Analyzing Tag Semantics Across Collaborative Tagging Systems},
  booktitle = {Proceedings of the Dagstuhl Seminar on Social Web Communities},
  editor = {Alani, Harith and Staab, Steffen and Stumme, Gerd},
  number = {08391},
  year = 2008,
  issn = {1862-4405},
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/benz2008analyzing.pdf},
  abstract = {The objective of our group was to exploit state-of-the-art Information Retrieval methods for finding associations and dependencies between tags, capturing and representing differences in tagging behavior and vocabulary of various folksonomies, with the overall aim to better understand the semantics of tags and the tagging process. Therefore we analyze the semantic content of tags in the Flickr and Delicious folksonomies. We find that: tag context similarity leads to meaningful results in Flickr, despite its narrow folksonomy character; the comparison of tags across Flickr and Delicious shows little semantic overlap, being tags in Flickr associated more to visual aspects rather than technological as it seems to be in Delicious; there are regions in the tag-tag space, provided with the cosine similarity metric, that are characterized by high density; the order of tags inside a post has a semantic relevance.},
  file = {benz2008analyzing.pdf:benz2008analyzing.pdf:PDF},
  groups = {public},
  interhash = {d738d9d90c1c466ee0a73ac0cc3dc4c1},
  intrahash = {6918e578527dec96abb5718f105d9f78},
  username = {dbenz},
}

@inproceedings{benz2009characterizing,
  author = {Benz, Dominik and Krause, Beate and Kumar, G. Praveen and Hotho, Andreas and Stumme, Gerd},
  title = {Characterizing Semantic Relatedness of Search Query Terms},
  booktitle = {Proceedings of the 1st Workshop on Explorative Analytics of Information Networks (EIN2009)},
  address = {Bled, Slovenia},
  month = sep,
  year = 2009,
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/benz2009characterizing.pdf},
  file = {benz2009characterizing.pdf:benz2009characterizing.pdf:PDF},
  groups = {public},
  interhash = {de5e58b26200e44112d9791f39e7523d},
  intrahash = {b697a98a7340585594455ee2e81d238a},
  username = {dbenz},
}

@inproceedings{cattuto2008semantic,
  author = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title = {Semantic Analysis of Tag Similarity Measures in Collaborative Tagging Systems},
  booktitle = {Proceedings of the 3rd Workshop on Ontology Learning and Population (OLP3)},
  pages = {39--43},
  address = {Patras, Greece},
  month = jul,
  year = 2008,
  isbn = {978-960-89282-6-8},
  note = {ISBN 978-960-89282-6-8},
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/cattuto2008semantic.pdf},
  homepage = {http://olp.dfki.de/olp3/},
  abstract = {Social bookmarking systems allow users to organise collections of resources on the Web in a collaborative fashion. The increasing popularity of these systems as well as first insights into their emergent semantics have made them relevant to disciplines like knowledge extraction and ontology learning. The problem of devising methods to measure the semantic relatedness between tags and characterizing it semantically is still largely open. Here we analyze three measures of tag relatedness: tag co-occurrence, cosine similarity of co-occurrence distributions, and FolkRank, an adaptation of the PageRank algorithm to folksonomies. Each measure is computed on tags from a large-scale dataset crawled from the social bookmarking system del.icio.us. To provide a semantic grounding of our findings, a connection to WordNet (a semantic lexicon for the English language) is established by mapping tags into synonym sets of WordNet, and applying there well-known metrics of semantic similarity. Our results clearly expose different characteristics of the selected measures of relatedness, making them applicable to different subtasks of knowledge extraction such as synonym detection or discovery of concept hierarchies.},
  file = {cattuto2008semantic.pdf:cattuto2008semantic.pdf:PDF},
  groups = {public},
  interhash = {cc62b733f6e0402db966d6dbf1b7711f},
  intrahash = {3b0aca61b24e4343bd80390614e3066e},
  username = {dbenz},
}

@inproceedings{cattuto2008semantica,
  author = {Cattuto, Ciro and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title = {Semantic Grounding of Tag Relatedness in Social Bookmarking Systems},
  booktitle = {The Semantic Web -- ISWC 2008, Proc. Intl. Semantic Web Conference 2008},
  editor = {Sheth, Amit P. and Staab, Steffen and Dean, Mike and Paolucci, Massimo and Maynard, Diana and Finin, Timothy W. and Thirunarayan, Krishnaprasad},
  series = {LNAI},
  volume = 5318,
  pages = {615--631},
  publisher = {Springer},
  address = {Heidelberg},
  year = 2008,
  doi = {10.1007/978-3-540-88564-1_39},
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/cattuto2008semantica.pdf},
  abstract = {Collaborative tagging systems have nowadays become important data sources for populating semantic web applications. For tasks like synonym detection and discovery of concept hierarchies, many researchers introduced measures of tag similarity. Even though most of these measures appear very natural, their design often seems to be rather ad hoc, and the underlying assumptions on the notion of similarity are not made explicit. A more systematic characterization and validation of tag similarity in terms of formal representations of knowledge is still lacking. Here we address this issue and analyze several measures of tag similarity: Each measure is computed on data from the social bookmarking system del.icio.us and a semantic grounding is provided by mapping pairs of similar tags in the folksonomy to pairs of synsets in Wordnet, where we use validated measures of semantic distance to characterize the semantic relation between the mapped tags. This exposes important features of the investigated similarity measures and indicates which ones are better suited in the context of a given semantic application.},
  file = {cattuto2008semantica.pdf:cattuto2008semantica.pdf:PDF},
  groups = {public},
  interhash = {b44538648cfd476d6c94e30bc6626c86},
  intrahash = {27198c985b3bdb6daab0f7e961b370a9},
  username = {dbenz},
}

@inproceedings{hotho2006emergent,
  author = {Hotho, Andreas and Jäschke, Robert and Schmitz, Christoph and Stumme, Gerd},
  title = {Emergent Semantics in {BibSonomy}},
  booktitle = {Informatik 2006 -- Informatik für Menschen. Band 2},
  editor = {Hochberger, Christian and Liskowsky, Rüdiger},
  series = {Lecture Notes in Informatics},
  volume = {P-94},
  publisher = {Gesellschaft für Informatik},
  address = {Bonn},
  month = oct,
  year = 2006,
  note = {Proc. Workshop on Applications of Semantic Technologies, Informatik 2006},
  url = {http://www.kde.cs.uni-kassel.de/stumme/papers/2006/hotho2006emergent.pdf},
  abstract = {Social bookmark tools are rapidly emerging on the Web. In such systems users are setting up lightweight conceptual structures called folksonomies. The reason for their immediate success is the fact that no specific skills are needed for participating. In this paper we specify a formal model for folksonomies, briefly describe our own system BibSonomy, which allows for sharing both bookmarks and publication references, and discuss first steps towards emergent semantics.},
  file = {hotho2006emergent.pdf:hotho2006emergent.pdf:PDF},
  groups = {public},
  interhash = {53e5677ab0bf1a8f5a635cc32c9082ba},
  intrahash = {05043cc20f1e0f5a612135c970e4f1ac},
  username = {dbenz},
}

@inproceedings{koerner2010stop,
  author = {Körner, Christian and Benz, Dominik and Strohmaier, Markus and Hotho, Andreas and Stumme, Gerd},
  title = {Stop Thinking, start Tagging - Tag Semantics emerge from Collaborative Verbosity},
  booktitle = {Proceedings of the 19th International World Wide Web Conference (WWW 2010)},
  publisher = {ACM},
  address = {Raleigh, NC, USA},
  month = apr,
  year = 2010,
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/koerner2010stop.pdf},
  abstract = {Recent research provides evidence for the presence of emergent semantics in collaborative tagging systems. While several methods have been proposed, little is known about the factors that influence the evolution of semantic structures in these systems. A natural hypothesis is that the quality of the emergent semantics depends on the pragmatics of tagging: Users with certain usage patterns might contribute more to the resulting semantics than others. In this work, we propose several measures which enable a pragmatic differentiation of taggers by their degree of contribution to emerging semantic structures. We distinguish between categorizers, who typically use a small set of tags as a replacement for hierarchical classification schemes, and describers, who are annotating resources with a wealth of freely associated, descriptive keywords. To study our hypothesis, we apply semantic similarity measures to 64 different partitions of a real-world and large-scale folksonomy containing different ratios of categorizers and describers. Our results not only show that ‘verbose’ taggers are most useful for the emergence of tag semantics, but also that a subset containing only 40\% of the most ‘verbose’ taggers can produce results that match and even outperform the semantic precision obtained from the whole dataset. Moreover, the results suggest that there exists a causal link between the pragmatics of tagging and resulting emergent semantics. This work is relevant for designers and analysts of tagging systems interested (i) in fostering the semantic development of their platforms, (ii) in identifying users introducing “semantic noise”, and (iii) in learning ontologies.},
  file = {koerner2010stop.pdf:koerner2010stop.pdf:PDF},
  groups = {public},
  interhash = {5afe6e4ce8357d8ac9698060fb438468},
  intrahash = {45f8d8f2a8251a5e988c596a5ebb3f2d},
  username = {dbenz},
}

@inproceedings{markines2009evaluating,
  author = {Markines, Benjamin and Cattuto, Ciro and Menczer, Filippo and Benz, Dominik and Hotho, Andreas and Stumme, Gerd},
  title = {Evaluating Similarity Measures for Emergent Semantics of Social Tagging},
  booktitle = {18th International World Wide Web Conference},
  pages = {641--650},
  month = apr,
  year = 2009,
  url = {http://www.kde.cs.uni-kassel.de/pub/pdf/markines2009evaluating.pdf},
  abstract = {Social bookmarking systems and their emergent information structures, known as folksonomies, are increasingly important data sources for Semantic Web applications. A key question for harvesting semantics from these systems is how to extend and adapt traditional notions of similarity to folksonomies, and which measures are best suited for applications such as navigation support, semantic search, and ontology learning. Here we build an evaluation framework to compare various general folksonomy-based similarity measures derived from established information-theoretic, statistical, and practical measures. Our framework deals generally and symmetrically with users, tags, and resources. For evaluation purposes we focus on similarity among tags and resources, considering different ways to aggregate annotations across users. After comparing how tag similarity measures predict user-created tag relations, we provide an external grounding by user-validated semantic proxies based on WordNet and the Open Directory. We also investigate the issue of scalability. We find that mutual information with distributional micro-aggregation across users yields the highest accuracy, but is not scalable; per-user projection with collaborative aggregation provides the best scalable approach via incremental computations. The results are consistent across resource and tag similarity.},
  file = {markines2009evaluating.pdf:markines2009evaluating.pdf:PDF},
  groups = {public},
  interhash = {a266558ad4d83d536a0be2ac94b6b7df},
  intrahash = {d16e752a8295d5dad7e26b199d9f614f},
  username = {dbenz},
}

@article{levy2008learning,
  author = {Levy, Mark and Sandler, Mark},
  title = {Learning latent semantic models for music from social tags},
  journal = {Journal of New Music Research},
  volume = 37,
  number = 2,
  pages = {137--150},
  publisher = {Routledge, part of the Taylor \& Francis Group},
  year = 2008,
  file = {levy2008learning.pdf:levy2008learning.pdf:PDF},
  groups = {public},
  interhash = {82ca1eaa0983bf17582b4b02597f2a1d},
  intrahash = {0681ab4879e2378295f724eb73e7360c},
  username = {dbenz},
}

@book{manning1999foundations,
  author = {Manning, Christopher D. and Sch{\"u}tze, Hinrich},
  title = {Foundations of Statistical Natural Language Processing},
  publisher = {MIT Press},
  address = {Cambridge, MA},
  year = 1999,
  interhash = {a81df02f92f266a51183fe936f588a08},
  intrahash = {e2f05fae5d02f579a85a10b79edf1d99},
}

@inproceedings{tatu2010inducing,
  author = {Tatu, Marta and Moldovan, Dan I.},
  title = {Inducing Ontologies from Folksonomies using Natural Language Understanding},
  booktitle = {{LREC}},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Rosner, Mike and Tapias, Daniel},
  publisher = {European Language Resources Association},
  year = 2010,
  isbn = {2-9517408-6-7},
  url = {http://dblp.uni-trier.de/db/conf/lrec/lrec2010.html#TatuM10},
  ee = {http://www.lrec-conf.org/proceedings/lrec2010/summaries/203.html},
  crossref = {conf/lrec/2010},
  interhash = {df87cca39d1fbe9d12d5441e0be169c5},
  intrahash = {deb8d2f57af4373047bcaba2fe67e39e},
}

@mastersthesis{meder2010multidomain,
  author = {Meder, Michael},
  title = {{Multi-Domain} {Klassifikation} basierend auf nutzergenerierten {Metadaten}},
  school = {Technische Universität Berlin},
  year = 2010,
  groups = {public},
  interhash = {c344c636c94156ba014c020d9e16b1e5},
  intrahash = {7ef2f23103d4c0ed0ad344f9ead8db9d},
  timestamp = {2011.07.20},
  username = {dbenz},
}

@incollection{doush2010integrating,
  author = {Abu Doush, Iyad and Pontelli, Enrico},
  title = {Integrating Semantic Web and Folksonomies to Improve E-Learning Accessibility},
  booktitle = {Computers Helping People with Special Needs},
  editor = {Miesenberger, Klaus and Klaus, Joachim and Zagler, Wolfgang and Karshmer, Arthur},
  series = {Lecture Notes in Computer Science},
  volume = 6179,
  pages = {376--383},
  publisher = {Springer Berlin / Heidelberg},
  year = 2010,
  doi = {10.1007/978-3-642-14097-6_60},
  url = {http://dx.doi.org/10.1007/978-3-642-14097-6_60},
  affiliation = {Yarmouk University Dept. Computer Science},
  interhash = {e05135c7b60b2cfae3165bcf8ff9d1c7},
  intrahash = {85c2161e2e6a320699e6fd71bf15393a},
}

@inproceedings{barla2009deriving,
  author = {Barla, Michal and Bielikov{\'a}, M{\'a}ria},
  title = {On Deriving Tagsonomies: Keyword Relations Coming from Crowd},
  booktitle = {Computational Collective Intelligence. Semantic Web, Social Networks and Multiagent System},
  editor = {Nguyen, Ngoc Thanh and Kowalczyk, Ryszard and Chen, Shyi-Ming},
  series = {Lecture Notes in Computer Science},
  volume = 5796,
  pages = {309--320},
  publisher = {Springer},
  year = 2009,
  isbn = {978-3-642-04440-3},
  doi = {10.1007/978-3-642-04441-0_27},
  url = {http://dx.doi.org/10.1007/978-3-642-04441-0_27},
  interhash = {ff65905d1c79503920fa46c013c2861c},
  intrahash = {98c5b4c0cdbc9344773f9867f90a6a3a},
}

@article{dbpedia_jws_09,
  author = {Lehmann, Jens and Bizer, Chris and Kobilarov, Georgi and Auer, Sören and Becker, Christian and Cyganiak, Richard and Hellmann, Sebastian},
  title = {{DBpedia} - A Crystallization Point for the Web of Data},
  journal = {Journal of Web Semantics},
  volume = 7,
  number = 3,
  pages = {154--165},
  year = 2009,
  doi = {10.1016/j.websem.2009.07.002},
  url = {http://jens-lehmann.org/files/2009/dbpedia_jws.pdf},
  interhash = {087f766f30469cbc881c83ad156a104a},
  intrahash = {f40d3f49ec12638400bdb99a930b4bbc},
}

@inproceedings{weichselbraun2010augmenting,
  author = {Weichselbraun, Albert and Wohlgenannt, Gerhard and Scharl, Arno},
  title = {Augmenting Lightweight Domain Ontologies with Social Evidence Sources},
  booktitle = {International Workshop on Database and Expert Systems Applications ({DEXA} 2010)},
  pages = {193--197},
  publisher = {IEEE Computer Society},
  address = {Los Alamitos, CA, USA},
  year = 2010,
  issn = {1529-4188},
  doi = {10.1109/DEXA.2010.53},
  url = {http://www.computer.org/portal/web/csdl/doi/10.1109/DEXA.2010.53},
  interhash = {c7adb30f1c3e4ba155dd36f76149f0eb},
  intrahash = {8e2afcb17621138bf6fac716bbbd5df3},
}

@incollection{springerlink:10.1007/978-3-540-76298-0_79,
  author = {Au Yeung, Ching-man and Gibbins, Nicholas and Shadbolt, Nigel},
  title = {Mutual Contextualization in Tripartite Graphs of Folksonomies},
  booktitle = {The Semantic Web},
  editor = {Aberer, Karl and Choi, Key-Sun and Noy, Natasha and Allemang, Dean and Lee, Kyung-Il and Nixon, Lyndon and Golbeck, Jennifer and Mika, Peter and Maynard, Diana and Mizoguchi, Riichiro and Schreiber, Guus and Cudré-Mauroux, Philippe},
  series = {Lecture Notes in Computer Science},
  volume = 4825,
  pages = {966--970},
  publisher = {Springer},
  address = {Berlin / Heidelberg},
  year = 2007,
  doi = {10.1007/978-3-540-76298-0_79},
  url = {http://dx.doi.org/10.1007/978-3-540-76298-0_79},
  abstract = {The use of tags to describe Web resources in a collaborative manner has experienced rising popularity among Web users in recent years. The product of such activity is given the name folksonomy, which can be considered as a scheme of organizing information in the users’ own way. This research work attempts to analyze tripartite graphs – graphs involving users, tags and resources – of folksonomies and discuss how these elements acquire their semantics through their associations with other elements, a process we call mutual contextualization. By studying such process, we try to identify solutions to problems such as tag disambiguation, retrieving documents of similar topics and discovering communities of users. This paper describes the basis of the research work, mentions work done so far and outlines future plans.},
  affiliation = {Intelligence, Agents and Multimedia Group (IAM), School of Electronics and Computer Science, University of Southampton, Southampton SO17 1BJ UK},
  interhash = {739050b87c491e82396f3ad3aa87073e},
  intrahash = {ceaf5504144fb6a88ef91853421a7644},
}

@inproceedings{angeletou2008semantically,
  author = {Angeletou, Sofia and Sabou, Marta and Motta, Enrico},
  title = {Semantically enriching folksonomies with {FLOR}},
  booktitle = {Proceedings of the CISWeb Workshop, located at the 5th European Semantic Web Conference ESWC 2008},
  year = 2008,
  url = {http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.141.2569},
  abstract = {While the increasing popularity of folksonomies has lead to a vast quantity of tagged data, resource retrieval in folksonomies is limited by being agnostic to the meaning (i.e., semantics) of tags. Our goal is to automatically enrich folksonomy tags (and implicitly the related resources) with formal semantics by associating them to relevant concepts defined in online ontologies. We introduce FLOR, a method that performs automatic folksonomy enrichment by combining knowledge from WordNet and online available ontologies. Experimentally testing FLOR, we found that it correctly enriched 72 \% of 250 Flickr photos.},
  file = {angeletou2008semantically.pdf:angeletou2008semantically.pdf:PDF},
  groups = {public},
  institution = {CiteSeerX - Scientific Literature Digital Library and Search Engine [http://citeseerx.ist.psu.edu/oai2] (United States)},
  interhash = {1b244d0220730e994822192f6e1cba76},
  intrahash = {e6404fa071680b21905ef7f3255359f7},
  location = {http://www.scientificcommons.org/47680629},
  timestamp = {2011-02-17 10:55:55},
  username = {dbenz},
}