@techreport{limpens2009linking, abstract = {Social tagging systems have recently become very popular as a means to classify large sets of resources shared among on-line communities over the social Web. However, the folksonomies resulting from the use of these systems revealed limitations: tags are ambiguous and their spelling may vary, and folksonomies are difficult to exploit in order to retrieve or exchange information. This report compares the recent attempts to overcome these limitations and to support the use of folksonomies with formal languages and ontologies from the Semantic Web.}, author = {Limpens, Freddy and Gandon, Fabien and Buffa, Michel}, institution = {INRIA, Institut National de Recherche en Informatique et Automatique}, interhash = {79fd59c735eed6708c0a3ca8db23636e}, intrahash = {db2ce0827f852bd879eef886b491a4ec}, month = {july}, title = {Linking Folksonomies and Ontologies for Supporting Knowledge Sharing: a State of the Art}, url = {http://isicil.inria.fr/docs/Livrables/ISICIL-ANR-EA01-FolksonomiesOntologies-0906.pdf}, year = 2009 } @article{garciasilva2011review, abstract = {This paper describes and compares the most relevant approaches for associating tags with semantics in order to make explicit the meaning of those tags. We identify a common set of steps that are usually considered across all these approaches and frame our descriptions according to them, providing a unified view of how each approach tackles the different problems that appear during the semantic association process. Furthermore, we provide some recommendations on (a) how and when to use each of the approaches according to the characteristics of the data source, and (b) how to improve results by leveraging the strengths of the different approaches.}, author = {Garcia-Silva, Andres and Corcho, Oscar and Alani, Harith and Gomez-Perez, Asuncion}, file = {garciasilva2011review.pdf:garciasilva2011review.pdf:PDF}, groups = {public}, interhash = {ef913839d8ab1f3955a9d05c5ba2fadf}, intrahash = {42f77eb846bdae1847ea70ca5ba6c9ec}, journal = {Knowledge Engineering Review}, month = {December}, number = 4, timestamp = {2011-02-15 03:13:28}, title = {Review of the state of the art: Discovering and Associating Semantics to Tags in Folksonomies}, username = {dbenz}, volume = 26, year = 2011 } @book{jain1988algorithms, address = {Upper Saddle River, NJ, USA}, author = {Jain, Anil K. and Dubes, Richard C.}, file = {jain1988algorithms.pdf:jain1988algorithms.pdf:PDF}, interhash = {443a79c152c5681cdc664714b50d116c}, intrahash = {4a1adbfdc7b83b201dd8fb3e5a109609}, lastdatemodified = {2007-03-13}, lastname = {Jain}, note = {Attention: PDF is rather large (~39MB)}, own = {notown}, pdf = {jain88_algorithms.pdf}, publisher = {Prentice-Hall, Inc.}, read = {notread}, title = {Algorithms for clustering data}, url = {http://portal.acm.org/citation.cfm?id=46712}, year = 1988 } @article{limpens2008bridging, abstract = {Social tagging systems have recently became very popular as a means to classify large sets of resources shared among on-line communities over the social Web. However, the folksonomies resulting from the use of these systems revealed limitations : tags are ambiguous and their spelling may vary, and folksonomies are difficult to exploit in order to retrieve or exchange information. This article compares the recent attempts to overcome these limitations and to support the use of folksonomies with formal languages and ontologies from the Semantic Web.}, author = {Limpens, Freddy and Gandon, Fabien and Buffa, Michel}, doi = {10.1109/ASEW.2008.4686305}, file = {limpens2008bridging.pdf:limpens2008bridging.pdf:PDF}, groups = {public}, interhash = {cb1d534be80d664a50df66e8977b774e}, intrahash = {9372f9c2db8b9f4cf05b3db84e6589ac}, journal = {Automated Software Engineering - Workshops, 2008. ASE Workshops 2008. 23rd IEEE/ACM International Conference on}, journalpub = {1}, month = {Sept.}, pages = {13-18}, timestamp = {2009-07-24 14:21:18}, title = {Bridging ontologies and folksonomies to leverage knowledge sharing on the social Web: A brief survey}, username = {dbenz}, year = 2008 } @article{cimiano2006ontologies, abstract = {Ontologies are nowadays used for many applications requiring data, services and resources in general to be interoperable and machine understandable. Such applications are for example web service discovery and composition, information integration across databases, intelligent search, etc. The general idea is that data and services are semantically described with respect to ontologies,which are formal specifications of a domain of interest, and can thus be shared and reused in a way such that the shared meaning specified by the ontology remains formally the same across different parties and applications. As the cost of creating ontologies is relatively high, different proposals have emerged for learning ontologies from structured and unstructured resources. In this article we examine the maturity of techniques for ontology learning from textual resources, addressing the question whether the state-of-the-art is mature enough to produce ontologies ‘on demand’.}, author = {Cimiano, Philipp and Völker, Johanna and Studer, Rudi}, file = {cimiano2006ontologies.pdf:cimiano2006ontologies.pdf:PDF}, groups = {public}, interhash = {aeb553dc2e190f0a5974dfdc709d450a}, intrahash = {fe4c2950b5be221b493e29e4339240e8}, journal = {Information, Wissenschaft und Praxis}, journalpub = {1}, month = OCT, note = {see the special issue for more contributions related to the Semantic Web}, number = {6-7}, pages = {315-320}, timestamp = {2008-07-23 11:47:29}, title = {Ontologies on Demand? - A Description of the State-of-the-Art, Applications, Challenges and Trends for Ontology Learning from Text}, url = {\url{http://www.aifb.uni-karlsruhe.de/WBS/pci/Publications/iwp06.pdf}}, username = {dbenz}, volume = 57, year = 2006 } @article{gomezperez2004overview, abstract = {Ontology learning aims at reducing the time and efforts in the ontology development process. In recent years, several methods and tools have been proposed to speed up this process using different sources of information and different techniques. In this paper, we have reviewed 13 methods and 14 tools for semi-automatically building ontologies from texts and their relationships with the techniques each method follows. The methods have been grouped according to the main techniques followed and three groups have been identified: one based on linguistics, one on statistics, and one on machine learning. Regarding the tools, the criterion for grouping them, which has been the main aim of the tool, is to distinguish what elements of the ontology can be learned with each tool. According to this, we have identified three kinds of tools: tools for learning relations, tools for learning new concepts, and assisting tools for building up taxonomies.}, author = {G{\'o}mez-P{\'e}rez, A. and Manzano-Macho, D.}, groups = {public}, interhash = {b0343c7d442b4942ce45d280c460e69e}, intrahash = {6f9619bc5e3c08f23944c5d6b0cb8755}, issn = {0269-8889}, journal = {The knowledge engineering review}, journalpub = {1}, number = 03, pages = {187--212}, publisher = {Cambridge Univ Press}, timestamp = {2010-11-10 11:05:38}, title = {An overview of methods and tools for ontology learning from texts}, url = {http://scholar.google.de/scholar.bib?q=info:YDF0G3pSYZ0J:scholar.google.com/&output=citation&hl=de&as_sdt=2000&ct=citation&cd=31}, username = {dbenz}, volume = 19, year = 2004 } @article{shamsfard2003state, abstract = {In recent years there have been some efforts to automate the ontology acquisition and construction process. The proposed systems differ from each other in some distinguishing factors and have many features in common. This paper presents the state of the art in ontology learning (OL) and introduces a framework for classifying and comparing OL systems. The dimensions of the framework answer to questions about what to learn, from where to learn and how to learn. They include features of the input, the methods of learning and knowledge acquisition, the elements learned, the resulted ontology and also the evaluation process. To extract the framework over 50 OL systems or modules from the recent workshops, conferences and published journals are studied and seven prominent of them with most differences are selected to be compared according to our framework. In this paper after a brief description of the seven selected systems we will describe the framework dimensions. Then we will place the representative ontology learning systems into our framework. At last we will describe the differences, strengths and weaknesses of various values for our dimensions in order to present a guideline for researchers to choose the appropriate features (dimensions’ values) to create or use an OL system for their own domain or application.}, author = {Shamsfard, M. and Barforoush, A. Abdollahzadeh}, file = {shamsfard2003state.pdf:shamsfard2003state.pdf:PDF}, groups = {public}, interhash = {d3ec24d1c064b37a8e371824c700dbb9}, intrahash = {b795b85be79c66a6bef78a6ad4864736}, issn = {0269-8889}, journal = {The Knowledge Engineering Review}, journalpub = {1}, number = 04, pages = {293--316}, publisher = {Cambridge Univ Press}, timestamp = {2010-11-10 10:45:36}, title = {The state of the art in ontology learning: a framework for comparison}, url = {http://scholar.google.de/scholar.bib?q=info:xYPkmvspOF8J:scholar.google.com/&output=citation&hl=de&as_sdt=2000&ct=citation&cd=13}, username = {dbenz}, volume = 18, year = 2003 } @article{zhou2007ontology, 0 = {http://dx.doi.org/10.1007/s10799-007-0019-5}, abstract = {Abstract\ \ Ontology is one of the fundamental cornerstones of the semantic Web. The pervasive use of ontologies in information sharing and knowledge management calls for efficient and effective approaches to ontology development. Ontology learning, which seeks to discover ontological knowledge from various forms of data automatically or semi-automatically, can overcome the bottleneck of ontology acquisition in ontology development. Despite the significant progress in ontology learning research over the past decade, there remain a number of open problems in this field. This paper provides a comprehensive review and discussion of major issues, challenges, and opportunities in ontology learning. We propose a new learning-oriented model for ontology development and a framework for ontology learning. Moreover, we identify and discuss important dimensions for classifying ontology learning approaches and techniques. In light of the impact of domain on choosing ontology learning approaches, we summarize domain characteristics that can facilitate future ontology learning effort. The paper offers a road map and a variety of insights about this fast-growing field.}, at = {2009-02-13 15:22:56}, author = {Zhou, Lina}, doi = {10.1007/s10799-007-0019-5}, file = {zhou2007ontology.pdf:zhou2007ontology.pdf:PDF}, groups = {public}, interhash = {78b6d3db998dcd27c475dfff3816f48f}, intrahash = {95b0f4f7c9c628e032d8bb4c69b432ed}, journal = {Information Technology and Management}, journalpub = {1}, misc_id = {1719627}, number = 3, pages = {241--252}, priority = {3}, timestamp = {2010-06-01 16:18:37}, title = {Ontology learning: state of the art and open issues}, url = {http://www.springerlink.com/content/j4g22112l7k00833/}, username = {dbenz}, volume = 8, year = 2007 } @article{biemann2005ontology, author = {Biemann, Chris}, ee = {http://www.jlcl.org/2005_Heft2/Chris_Biemann.pdf}, file = {biemann2005ontology.pdf:biemann2005ontology.pdf:PDF}, groups = {public}, interhash = {1654cddcb952b226749bd4868c44d259}, intrahash = {32ff761ee73911a932eae6e2af8d3b24}, journal = {LDV Forum}, journalpub = {1}, number = 2, pages = {75-93}, timestamp = {2011-02-02 14:17:13}, title = {Ontology Learning from Text: A Survey of Methods.}, url = {http://dblp.uni-trier.de/db/journals/ldvf/ldvf20.html#Biemann05}, username = {dbenz}, volume = 20, year = 2005 } @article{brewster2009issues, abstract = {BACKGROUND: Ontology construction for any domain is a labour intensive and complex process. Any methodology that can reduce the cost and increase efficiency has the potential to make a major impact in the life sciences. This paper describes an experiment in ontology construction from text for the animal behaviour domain. Our objective was to see how much could be done in a simple and relatively rapid manner using a corpus of journal papers. We used a sequence of pre-existing text processing steps, and here describe the different choices made to clean the input, to derive a set of terms and to structure those terms in a number of hierarchies. We describe some of the challenges, especially that of focusing the ontology appropriately given a starting point of a heterogeneous corpus. RESULTS: Using mainly automated techniques, we were able to construct an 18055 term ontology-like structure with 73% recall of animal behaviour terms, but a precision of only 26%. We were able to clean unwanted terms from the nascent ontology using lexico-syntactic patterns that tested the validity of term inclusion within the ontology. We used the same technique to test for subsumption relationships between the remaining terms to add structure to the initially broad and shallow structure we generated. All outputs are available at http://thirlmere.aston.ac.uk/\~kiffer/animalbehaviour/. CONCLUSION: We present a systematic method for the initial steps of ontology or structured vocabulary construction for scientific domains that requires limited human effort and can make a contribution both to ontology learning and maintenance. The method is useful both for the exploration of a scientific domain and as a stepping stone towards formally rigourous ontologies. The filtering of recognised terms from a heterogeneous corpus to focus upon those that are the topic of the ontology is identified to be one of the main challenges for research in ontology learning.}, author = {Brewster, C and Jupp, S and Luciano, J and Shotton, D and Stevens, R D and Zhang, Z}, doi = {10.1186/1471-2105-10-S5-S1}, file = {brewster2009issues.pdf:brewster2009issues.pdf:PDF}, groups = {public}, interhash = {f4b4e74631a837df6c3d102731ec46c3}, intrahash = {e9a83a729df52557d560ad98404774c3}, journal = {BMC Bioinformatics}, journalpub = {1}, pmid = {19426458}, timestamp = {2011-02-02 14:18:04}, title = {Issues in learning an ontology from text}, url = {http://www.ncbi.nlm.nih.gov/pubmed/19426458}, username = {dbenz}, volume = {10 Suppl 5}, year = 2009 } @inproceedings{omelayenko2001learning, abstract = {The next generation of the Web, called Semantic Web, has to improve the Web with semantic (ontological) page annotations to enable knowledge-level querying and searches. Manual construction of these ontologies will require tremendous efforts that force future integration of machine learning with knowledge acquisition to enable highly automated ontology learning. In the paper we present the state of the-art in the field of ontology learning from the Web to see how it can contribute to the task of semantic Web querying. We consider three components of the query processing system: natural language ontologies, domain ontologies and ontology instances. We discuss the requirements for machine learning algorithms to be applied for the learning of the ontologies of each type from the Web documents, and survey the existent ontology learning and other closely related approaches.}, author = {Omelayenko, Borys}, booktitle = {Proceedings of the International Workshop on Web Dynamics, held in conj. with the 8th International Conference on Database Theory (ICDT’01), London, UK}, file = {omelayenko2001learning.pdf:omelayenko2001learning.pdf:PDF}, groups = {public}, interhash = {011d45b904b02fdf1a65122d2832710b}, intrahash = {3edf80da8b39eefeea46379581628adf}, timestamp = {2011-02-02 15:03:05}, title = {Learning of Ontologies for the Web: the Analysis of Existent Approaches}, url = {http://www.dcs.bbk.ac.uk/webDyn/webDynPapers/omelayenko.pdf}, username = {dbenz}, year = 2001 }