% Bookmarked web resources, all tagged with the keywords "corpus" and "dataset".
%
% Conventions used by the entries below:
%   - The citation key of each entry is the host name of its url.
%   - Entries are listed newest first, according to their added-at timestamp.
%   - biburl, added-at, interhash and intrahash are bookkeeping fields carried
%     over from the bookmarking service; standard styles ignore unknown fields.
%   - description is only present where it carries text.
%   - Braces inside a title protect proper nouns, acronyms and German nouns
%     from being lower-cased by styles that apply sentence casing.
%
% NOTE(review): the "electronic" entry type is not one of the classic BibTeX
% types; biblatex documents it as an alias of "online", while classic styles
% that do not know it are expected to fall back to their default (misc-like)
% type. It is kept as-is so that existing citations render the same way.
% Confirm against the bibliography style actually in use.

@electronic{fr46.uni-saarland.de,
  title       = {{UdS} :: {FR} 4.6: Register im {Kontakt}},
  url         = {http://fr46.uni-saarland.de/index.php?id=regico},
  biburl      = {https://puma.uni-kassel.de/url/02bd78b005b224e20d38eb8b5c48d359/hotho},
  keywords    = {corpus dataset hd linguistics},
  added-at    = {2014-09-29T17:49:06.000+0200},
  description = {Universität des Saarlandes,Übersetzung,Dolmetschen,Angewandte Sprachwissenschaft,UdS},
  interhash   = {02bd78b005b224e20d38eb8b5c48d359},
  intrahash   = {02bd78b005b224e20d38eb8b5c48d359},
}

@electronic{googleresearch.blogspot.de,
  title       = {50,000 Lessons on How to Read: a Relation Extraction Corpus},
  url         = {http://googleresearch.blogspot.de/2013/04/50000-lessons-on-how-to-read-relation.html},
  biburl      = {https://puma.uni-kassel.de/url/581c1631a929f1162f86e02337d50478/hotho},
  keywords    = {corpus dataset extraction relation},
  added-at    = {2013-04-17T09:57:10.000+0200},
  interhash   = {581c1631a929f1162f86e02337d50478},
  intrahash   = {581c1631a929f1162f86e02337d50478},
}

@electronic{trec.nist.gov,
  title       = {Tweets2011 {Twitter} Collection},
  url         = {http://trec.nist.gov/data/tweets/},
  biburl      = {https://puma.uni-kassel.de/url/6114f26ca8c1a62f39518e1eadc722bc/hotho},
  keywords    = {corpus dataset everyaware twitter},
  added-at    = {2011-09-02T10:41:42.000+0200},
  description = {Tweets2011 As part of the TREC 2011 microblog track, Twitter provided identifiers for approximately 16 million tweets sampled between January 23rd and February 8th, 2011. The corpus is designed to be a reusable, representative sample of the twittersphere - i.e. both important and spam tweets are included.},
  interhash   = {6114f26ca8c1a62f39518e1eadc722bc},
  intrahash   = {6114f26ca8c1a62f39518e1eadc722bc},
}

@electronic{www.cs.pitt.edu,
  title       = {{MPQA} Releases},
  url         = {http://www.cs.pitt.edu/mpqa/},
  biburl      = {https://puma.uni-kassel.de/url/f1343ddd814a4f0fb5cdb52db55afa0b/hotho},
  keywords    = {corpus dataset mpqa opinion},
  added-at    = {2010-03-17T11:31:14.000+0100},
  interhash   = {f1343ddd814a4f0fb5cdb52db55afa0b},
  intrahash   = {f1343ddd814a4f0fb5cdb52db55afa0b},
}

@electronic{devoted.to,
  title       = {David {Lee's} Bookmarks for Corpus-based Linguists},
  url         = {http://devoted.to/corpora},
  biburl      = {https://puma.uni-kassel.de/url/714a6270040c564229df5c60db472484/hotho},
  keywords    = {corpus dataset lecture nlp survey},
  added-at    = {2008-04-29T15:03:05.000+0200},
  interhash   = {714a6270040c564229df5c60db472484},
  intrahash   = {714a6270040c564229df5c60db472484},
}

@electronic{www.grsampson.net,
  title       = {Geoffrey {Sampson}: Downloadable Resources},
  url         = {http://www.grsampson.net/Resources.html},
  biburl      = {https://puma.uni-kassel.de/url/85e6aa977e160d792141038d38915682/hotho},
  keywords    = {corpus dataset lecture nlp tm},
  added-at    = {2008-04-29T12:09:45.000+0200},
  interhash   = {85e6aa977e160d792141038d38915682},
  intrahash   = {85e6aa977e160d792141038d38915682},
}

@electronic{www.linguistlist.org,
  title       = {{Linguist} {List} - Web Resource Listings},
  url         = {http://www.linguistlist.org/sp/Texts.html},
  biburl      = {https://puma.uni-kassel.de/url/70d16dc2e74cf3bb1f8fe4f8dbd8f17f/hotho},
  keywords    = {corpus dataset lecture nlp},
  added-at    = {2008-04-29T12:06:42.000+0200},
  interhash   = {70d16dc2e74cf3bb1f8fe4f8dbd8f17f},
  intrahash   = {70d16dc2e74cf3bb1f8fe4f8dbd8f17f},
}

@electronic{aune.lpl.univ-aix.fr,
  title       = {Multext},
  url         = {http://aune.lpl.univ-aix.fr/projects/multext/},
  biburl      = {https://puma.uni-kassel.de/url/aadc8b8fde1c4cc4affcfa02f649f6be/hotho},
  keywords    = {corpus dataset text},
  added-at    = {2007-11-16T17:36:20.000+0100},
  interhash   = {aadc8b8fde1c4cc4affcfa02f649f6be},
  intrahash   = {aadc8b8fde1c4cc4affcfa02f649f6be},
}

@electronic{plg.uwaterloo.ca,
  title       = {Trec Spam Corpus},
  url         = {http://plg.uwaterloo.ca/~gvcormac/treccorpus/},
  biburl      = {https://puma.uni-kassel.de/url/612bf65a435736bdb79b895c6b070429/hotho},
  keywords    = {trec spam set data dataset corpus},
  added-at    = {2006-09-04T15:42:51.000+0200},
  interhash   = {612bf65a435736bdb79b895c6b070429},
  intrahash   = {612bf65a435736bdb79b895c6b070429},
}

@electronic{sinai.ujaen.es,
  title       = {{HepCorpus} - {Sinai}},
  url         = {http://sinai.ujaen.es/wiki/index.php/HepCorpus#English_version},
  biburl      = {https://puma.uni-kassel.de/url/2a94f6d49e5f0d09fcd7d47ead339d62/hotho},
  keywords    = {text dataset corpus},
  added-at    = {2006-05-29T15:53:16.000+0200},
  interhash   = {2a94f6d49e5f0d09fcd7d47ead339d62},
  intrahash   = {2a94f6d49e5f0d09fcd7d47ead339d62},
}

@electronic{www.bmanuel.org,
  title       = {Manuel {Barbera}, Corpus based computational linguistic resources. General: {E-Texts} (§ 2.3).},
  url         = {http://www.bmanuel.org/clr2_et.html},
  biburl      = {https://puma.uni-kassel.de/url/35e334c2b9116aa25f7e10bed79d0347/hotho},
  keywords    = {text dataset corpus},
  added-at    = {2006-05-26T08:21:51.000+0200},
  description = {Electronic Literary Text Archives.},
  interhash   = {35e334c2b9116aa25f7e10bed79d0347},
  intrahash   = {35e334c2b9116aa25f7e10bed79d0347},
}

@electronic{muchmore.dfki.de,
  title       = {much.more},
  url         = {http://muchmore.dfki.de/resources_index.htm},
  biburl      = {https://puma.uni-kassel.de/url/5f2e4b0e4d51a2d01853a889f021fee3/hotho},
  keywords    = {dataset corpus},
  added-at    = {2006-04-07T10:58:58.000+0200},
  description = {A number of resources have been compiled within the context of the MuchMore project. These include: a bilingual, parallel medical corpus; corresponding queries and relevance assessments; evaluation sets of disambiguated terms for GermaNet and UMLS; an evaluation list for morphological decomposition of medical terms.},
  interhash   = {5f2e4b0e4d51a2d01853a889f021fee3},
  intrahash   = {5f2e4b0e4d51a2d01853a889f021fee3},
}