% Bibliography entries on statistical NLP, lexical co-occurrence and
% semantic similarity. One field per line; interhash/intrahash and other
% non-standard fields are bookkeeping data that standard styles ignore.

% Book entry.
@book{manning1999foundations,
  address   = {Cambridge, MA},
  author    = {Manning, C. and Sch{\"u}tze, H.},
  interhash = {a81df02f92f266a51183fe936f588a08},
  intrahash = {e2f05fae5d02f579a85a10b79edf1d99},
  publisher = {MIT Press},
  title     = {Foundations of Statistical Natural Language Processing},
  year      = 1999
}

% Journal article; the DOI is stored bare and the url field mirrors it.
@article{spence1990lexical,
  abstract    = {The 1-million-word Brown corpus was searched for co-occurrences of semantically related pairs of concrete nouns appearing within an arbitrary window of 250 characters. Related pairs of nouns (OCEAN-WATER) co-occur significantly more often than matched, unrelated pairs (OCEAN-HAND), and this difference remained significant within blocks of text up to 1000 characters in length. Frequency of co-occurrence, corrected for chance, is significantly correlated with association strength. Lexical distance between co-occurring members of a given pair is inversely correlated with association strength. Significantly more co-occurrences were found, per unit text, in the fictional sections of the corpus.},
  affiliation = {Department of Psychiatry Robert Wood Johnson Medical School 08854 Piscataway New Jersey},
  author      = {Spence, Donald P. and Owens, Kimberly C.},
  doi         = {10.1007/BF01074363},
  interhash   = {75d5913fcca51ebf5fd7e281c36a69e9},
  intrahash   = {3e0a291d4193c824616c6f73ad0a4101},
  issn        = {0090-6905},
  journal     = {Journal of Psycholinguistic Research},
  keyword     = {Behavioral Science},
  number      = {5},
  pages       = {317--330},
  publisher   = {Springer Netherlands},
  title       = {Lexical co-occurrence and association strength},
  url         = {http://dx.doi.org/10.1007/BF01074363},
  volume      = 19,
  year        = 1990
}

% Conference paper; the crossref parent (conf/eacl/2006) is not defined in
% this part of the file and must be provided elsewhere.
@inproceedings{liu2006web,
  author    = {Liu, Vinci and Curran, James R.},
  booktitle = {EACL},
  crossref  = {conf/eacl/2006},
  ee        = {http://acl.ldc.upenn.edu/E/E06/E06-1030.pdf},
  interhash = {f966023df4185e781314340265d3df1f},
  intrahash = {934a38bd8d7696cff1da3a2df3724407},
  isbn      = {1-932432-59-0},
  publisher = {The Association for Computer Linguistics},
  title     = {Web Text Corpus for Natural Language Processing},
  url       = {http://dblp.uni-trier.de/db/conf/eacl/eacl2006.html#LiuC06},
  year      = 2006
}

% German-language book; the title stays fully braced so that sentence-casing
% styles do not lowercase the German nouns.
@book{helbig2008wissensverarbeitung,
  abstract  = {Das Buch gibt eine umfassende Darstellung einer Methodik zur Interpretation und Bedeutungsrepr{\"a}sentation nat{\"u}rlichsprachlicher Ausdr{\"u}cke. Diese Methodik der Mehrschichtigen Erweiterten Semantischen Netze (MultiNet) ist sowohl f{\"u}r theoretische Untersuchungen als auch f{\"u}r die automatische Verarbeitung nat{\"u}rlicher Sprache auf dem Rechner geeignet. Die vorgestellten Ergebnisse sind eingebettet in ein System von Software-Werkzeugen, die eine praktische Nutzung der MultiNet-Darstellungsmittel als Formalismus zur Bedeutungsrepr{\"a}sentation sichern. Hierzu geh{\"o}ren: eine Werkbank f{\"u}r den Wissensingenieur, ein {\"U}bersetzungssystem zur automatischen Gewinnung von Bedeutungsdarstellungen nat{\"u}rlichsprachlicher S{\"a}tze und eine Werkbank f{\"u}r den Computerlexikographen.},
  address   = {Berlin},
  author    = {Helbig, Hermann},
  doi       = {10.1007/978-3-540-76278-2},
  edition   = {2.},
  file      = {Amazon Search inside:http\://www.amazon.de/gp/reader/3540762760/:URL},
  interhash = {f7c09fb5257be21200f6a9622c5d301c},
  intrahash = {6eff05ef4aa01e934aa45df7a7ad3154},
  isbn      = {3-540-76276-0},
  publisher = {Springer},
  title     = {{Wissensverarbeitung und die Semantik der nat{\"u}rlichen Sprache: Wissensrepr{\"a}sentation mit MultiNet}},
  year      = 2008
}

% Conference paper; apostrophes in the abstract were restored from
% mis-encoded characters.
@inproceedings{jarmasz2003rogets,
  abstract  = {We have implemented a system that measures semantic similarity using a computerized 1987 Roget's Thesaurus, and evaluated it by performing a few typical tests. We compare the results of these tests with those produced by WordNet-based similarity measures. One of the benchmarks is Miller and Charles' list of 30 noun pairs to which human judges had assigned similarity measures. We correlate these measures with those computed by several NLP systems. The 30 pairs can be traced back to Rubenstein and Goodenough's 65 pairs, which we have also studied. Our Roget's-based system gets correlations of .878 for the smaller and .818 for the larger list of noun pairs; this is quite close to the .885 that Resnik obtained when he employed humans to replicate the Miller and Charles experiment. We further evaluate our measure by using Roget's and WordNet to answer 80 TOEFL, 50 ESL and 300 Reader's Digest questions: the correct synonym must be selected amongst a group of four words. Our system gets 78.75\%, 82.00\% and 74.33\% of the questions respectively.},
  author    = {Jarmasz, Mario and Szpakowicz, Stan},
  booktitle = {Conference on Recent Advances in Natural Language Processing},
  interhash = {e28cc3a4231e064f44cfdb2e3338aaf3},
  intrahash = {acde39a427ef0e7501f07e8b067a88f0},
  pages     = {212--219},
  title     = {{Roget's} thesaurus and semantic similarity},
  url       = {http://www.site.uottawa.ca/~mjarmasz/pubs/jarmasz_roget_sim.pdf},
  year      = 2003
}

% Book entry; the series name lives in its own field rather than in the title.
@book{jurafsky2000speech,
  asin      = {0130950696},
  author    = {Jurafsky, Daniel and Martin, James H.},
  dewey     = {410.285},
  ean       = {9780130950697},
  edition   = 1,
  interhash = {ae1205b1f526d068fc9364510bf99418},
  intrahash = {25110e6691b5ee9dbe97216ce087487f},
  isbn      = {0130950696},
  note      = {neue Auflage kommt im Fr{\"u}hjahr 2008},
  publisher = {Prentice Hall},
  series    = {Prentice Hall Series in Artificial Intelligence},
  title     = {Speech and Language Processing: An Introduction to Natural Language Processing, Computational Linguistics and Speech Recognition},
  url       = {http://www.amazon.com/gp/redirect.html%3FASIN=0130950696%26tag=ws%26lcode=xm2%26cID=2025%26ccmID=165953%26location=/o/ASIN/0130950696%253FSubscriptionId=13CT5CVB80YFWJEPWS02},
  year      = 2000
}

% Workshop paper; the url is stored raw (no url macro wrapper) so that the
% bibliography style decides how to typeset it.
@inproceedings{cimiano2003automaticb,
  author           = {Cimiano, Philipp and Staab, Steffen and Tane, Julien},
  booktitle        = {Proceedings of the ECML/PKDD Workshop on Adaptive Text Extraction and Mining, Cavtat-Dubrovnik, Croatia},
  interhash        = {2f9df79fa0d890faa91dc1d0d0def735},
  intrahash        = {c62b4e1dc65490d68bef7eaed01f83ea},
  lastdatemodified = {2007-03-22},
  lastname         = {Cimiano},
  own              = {notown},
  pages            = {10--17},
  pdf              = {cimiano03-automatic.pdf},
  read             = {notread},
  title            = {Automatic Acquisition of Taxonomies from Text: {FCA} meets {NLP}},
  url              = {http://www.aifb.uni-karlsruhe.de/WBS/pci/ontolearning.pdf},
  year             = 2003
}