@comment{
  Bookmarked web resources (text corpora and datasets) as exported from
  PUMA (puma.uni-kassel.de, user hotho).
  - Citation keys are the host names of the bookmarked URLs.
  - biburl, interhash and intrahash identify the bookmark inside PUMA;
    added-at is the time the bookmark was stored there.
  - Words in titles that must keep their capitalisation under
    sentence-casing styles are wrapped in braces.
  - Fields that were exported empty have been dropped.
}

@electronic{fr46.uni-saarland.de,
  title       = {{UdS} :: {FR} 4.6: {Register} im {Kontakt}},
  url         = {http://fr46.uni-saarland.de/index.php?id=regico},
  biburl      = {https://puma.uni-kassel.de/url/02bd78b005b224e20d38eb8b5c48d359/hotho},
  keywords    = {corpus dataset hd linguistics},
  added-at    = {2014-09-29T17:49:06.000+0200},
  description = {Universität des Saarlandes,Übersetzung,Dolmetschen,Angewandte Sprachwissenschaft,UdS},
  interhash   = {02bd78b005b224e20d38eb8b5c48d359},
  intrahash   = {02bd78b005b224e20d38eb8b5c48d359},
}

@electronic{trec.nist.gov,
  title       = {{Tweets2011} {Twitter} Collection},
  url         = {http://trec.nist.gov/data/tweets/},
  biburl      = {https://puma.uni-kassel.de/url/6114f26ca8c1a62f39518e1eadc722bc/hotho},
  keywords    = {corpus dataset everyaware twitter},
  added-at    = {2011-09-02T10:41:42.000+0200},
  description = {Tweets2011 As part of the TREC 2011 microblog track, Twitter provided identifiers for approximately 16 million tweets sampled between January 23rd and February 8th, 2011. The corpus is designed to be a reusable, representative sample of the twittersphere - i.e. both important and spam tweets are included.},
  interhash   = {6114f26ca8c1a62f39518e1eadc722bc},
  intrahash   = {6114f26ca8c1a62f39518e1eadc722bc},
}

@electronic{plg.uwaterloo.ca,
  title       = {Trec Spam Corpus},
  url         = {http://plg.uwaterloo.ca/~gvcormac/treccorpus/},
  biburl      = {https://puma.uni-kassel.de/url/612bf65a435736bdb79b895c6b070429/hotho},
  keywords    = {trec spam set data dataset corpus},
  added-at    = {2006-09-04T15:42:51.000+0200},
  interhash   = {612bf65a435736bdb79b895c6b070429},
  intrahash   = {612bf65a435736bdb79b895c6b070429},
}

@electronic{aune.lpl.univ-aix.fr,
  title       = {Multext},
  url         = {http://aune.lpl.univ-aix.fr/projects/multext/},
  biburl      = {https://puma.uni-kassel.de/url/aadc8b8fde1c4cc4affcfa02f649f6be/hotho},
  keywords    = {corpus dataset text},
  added-at    = {2007-11-16T17:36:20.000+0100},
  interhash   = {aadc8b8fde1c4cc4affcfa02f649f6be},
  intrahash   = {aadc8b8fde1c4cc4affcfa02f649f6be},
}

@electronic{muchmore.dfki.de,
  title       = {much.more},
  url         = {http://muchmore.dfki.de/resources_index.htm},
  biburl      = {https://puma.uni-kassel.de/url/5f2e4b0e4d51a2d01853a889f021fee3/hotho},
  keywords    = {dataset corpus},
  added-at    = {2006-04-07T10:58:58.000+0200},
  description = {A number of resources have been compiled within the context of the MuchMore project. These include: a bilingual, parallel medical corpus; corresponding queries and relevance assessments; evaluation sets of disambiguated terms for GermaNet and UMLS; an evaluation list for morphological decomposition of medical terms.},
  interhash   = {5f2e4b0e4d51a2d01853a889f021fee3},
  intrahash   = {5f2e4b0e4d51a2d01853a889f021fee3},
}

@electronic{www.cs.pitt.edu,
  title       = {{MPQA} Releases},
  url         = {http://www.cs.pitt.edu/mpqa/},
  biburl      = {https://puma.uni-kassel.de/url/f1343ddd814a4f0fb5cdb52db55afa0b/hotho},
  keywords    = {corpus dataset mpqa opinion},
  added-at    = {2010-03-17T11:31:14.000+0100},
  interhash   = {f1343ddd814a4f0fb5cdb52db55afa0b},
  intrahash   = {f1343ddd814a4f0fb5cdb52db55afa0b},
}

@electronic{www.bmanuel.org,
  title       = {Manuel {Barbera}, {Corpus} based computational linguistic resources. {General}: {E-Texts} ({\S} 2.3).},
  url         = {http://www.bmanuel.org/clr2_et.html},
  biburl      = {https://puma.uni-kassel.de/url/35e334c2b9116aa25f7e10bed79d0347/hotho},
  keywords    = {text dataset corpus},
  added-at    = {2006-05-26T08:21:51.000+0200},
  description = {Electronic Literary Text Archives.},
  interhash   = {35e334c2b9116aa25f7e10bed79d0347},
  intrahash   = {35e334c2b9116aa25f7e10bed79d0347},
}

@electronic{www.linguistlist.org,
  title       = {{Linguist List} - Web Resource Listings},
  url         = {http://www.linguistlist.org/sp/Texts.html},
  biburl      = {https://puma.uni-kassel.de/url/70d16dc2e74cf3bb1f8fe4f8dbd8f17f/hotho},
  keywords    = {corpus dataset lecture nlp},
  added-at    = {2008-04-29T12:06:42.000+0200},
  interhash   = {70d16dc2e74cf3bb1f8fe4f8dbd8f17f},
  intrahash   = {70d16dc2e74cf3bb1f8fe4f8dbd8f17f},
}

@electronic{sinai.ujaen.es,
  title       = {{HepCorpus} - {Sinai}},
  url         = {http://sinai.ujaen.es/wiki/index.php/HepCorpus#English_version},
  biburl      = {https://puma.uni-kassel.de/url/2a94f6d49e5f0d09fcd7d47ead339d62/hotho},
  keywords    = {text dataset corpus},
  added-at    = {2006-05-29T15:53:16.000+0200},
  interhash   = {2a94f6d49e5f0d09fcd7d47ead339d62},
  intrahash   = {2a94f6d49e5f0d09fcd7d47ead339d62},
}

@electronic{www.grsampson.net,
  title       = {Geoffrey {Sampson}: Downloadable Resources},
  url         = {http://www.grsampson.net/Resources.html},
  biburl      = {https://puma.uni-kassel.de/url/85e6aa977e160d792141038d38915682/hotho},
  keywords    = {corpus dataset lecture nlp tm},
  added-at    = {2008-04-29T12:09:45.000+0200},
  interhash   = {85e6aa977e160d792141038d38915682},
  intrahash   = {85e6aa977e160d792141038d38915682},
}

@electronic{devoted.to,
  title       = {{David Lee's} Bookmarks for Corpus-based Linguists},
  url         = {http://devoted.to/corpora},
  biburl      = {https://puma.uni-kassel.de/url/714a6270040c564229df5c60db472484/hotho},
  keywords    = {corpus dataset lecture nlp survey},
  added-at    = {2008-04-29T15:03:05.000+0200},
  interhash   = {714a6270040c564229df5c60db472484},
  intrahash   = {714a6270040c564229df5c60db472484},
}

@electronic{googleresearch.blogspot.de,
  title       = {50,000 Lessons on How to Read: a Relation Extraction Corpus},
  url         = {http://googleresearch.blogspot.de/2013/04/50000-lessons-on-how-to-read-relation.html},
  biburl      = {https://puma.uni-kassel.de/url/581c1631a929f1162f86e02337d50478/hotho},
  keywords    = {corpus dataset extraction relation},
  added-at    = {2013-04-17T09:57:10.000+0200},
  interhash   = {581c1631a929f1162f86e02337d50478},
  intrahash   = {581c1631a929f1162f86e02337d50478},
}