% Web bookmarks, each tagged "dataset"; every biburl points at puma.uni-kassel.de.
% Each record is an "electronic" entry: title and url identify the page, while
% biburl, keywords, added-at, description, interhash and intrahash are bookmark
% metadata (unknown fields are silently ignored by bibliography styles).
% Proper nouns and acronyms in titles are brace-protected as whole words so
% that sentence-casing styles do not lowercase them.
% NOTE: do not type an at-sign in these comment lines; BibTeX treats it as the
% start of an entry even outside a record.

electronic-entries-begin

@electronic{infochimps.org,
  title       = {{Twitter} data sets for download - {Infochimps}},
  url         = {http://infochimps.org/tags/twitter},
  biburl      = {https://puma.uni-kassel.de/url/6d90faa71befc28ab285391e88270b86/benz},
  keywords    = {dataset download twitter},
  added-at    = {2011-02-04T16:07:23.000+0100},
  description = {},
  interhash   = {6d90faa71befc28ab285391e88270b86},
  intrahash   = {6d90faa71befc28ab285391e88270b86}
}

@electronic{evanjones.ca,
  title       = {Extracting Text from {Wikipedia}},
  url         = {http://evanjones.ca/software/wikipedia2text.html},
  biburl      = {https://puma.uni-kassel.de/url/7ee155b9d5b03240e99556cbf828f202/benz},
  keywords    = {data dataset plain_text python text tool wiki wikipedia},
  added-at    = {2011-02-04T16:07:25.000+0100},
  description = {},
  interhash   = {7ee155b9d5b03240e99556cbf828f202},
  intrahash   = {7ee155b9d5b03240e99556cbf828f202}
}

@electronic{www.p2p.tu-darmstadt.de,
  title       = {Research},
  url         = {http://www.p2p.tu-darmstadt.de/research/},
  biburl      = {https://puma.uni-kassel.de/url/f518aee1c775b508e6145577ba08264a/benz},
  keywords    = {dataset social_networks socialnetwork},
  added-at    = {2011-02-04T16:07:27.000+0100},
  description = {},
  interhash   = {f518aee1c775b508e6145577ba08264a},
  intrahash   = {f518aee1c775b508e6145577ba08264a}
}

@electronic{socialnetworks.mpi-sws.org,
  title       = {Online Social Networks Research {@MPI-SWS}},
  url         = {http://socialnetworks.mpi-sws.org/},
  biburl      = {https://puma.uni-kassel.de/url/bd1d323860ba4faafd18250421c1dc94/benz},
  keywords    = {dataset download misvlove social_network},
  added-at    = {2011-02-04T16:07:28.000+0100},
  description = {},
  interhash   = {bd1d323860ba4faafd18250421c1dc94},
  intrahash   = {bd1d323860ba4faafd18250421c1dc94}
}

@electronic{www.eml-research.de,
  title       = {Download {Wikipedia} Category Taxonomy},
  url         = {http://www.eml-research.de/english/research/nlp/download/wikitaxonomy.php},
  biburl      = {https://puma.uni-kassel.de/url/9d33bae08b8defaa95cda39608876bf6/benz},
  keywords    = {categories category_hierarchy dataset download hierarchy ontology taxonomy wikipedia},
  added-at    = {2011-02-04T16:07:33.000+0100},
  description = {},
  interhash   = {9d33bae08b8defaa95cda39608876bf6},
  intrahash   = {9d33bae08b8defaa95cda39608876bf6}
}

@electronic{twapperkeeper.com,
  title       = {{Twapper Keeper} - Archive Tweets},
  url         = {http://twapperkeeper.com/},
  biburl      = {https://puma.uni-kassel.de/url/273e6fdd06c89ce7a09eeb2b1598ee09/benz},
  keywords    = {dataset twapper twapper_keeper twitter},
  added-at    = {2011-02-04T16:07:48.000+0100},
  description = {Allows you to archive and organize your tweets based upon hash tags.},
  interhash   = {273e6fdd06c89ce7a09eeb2b1598ee09},
  intrahash   = {273e6fdd06c89ce7a09eeb2b1598ee09}
}

@electronic{www.mail-archive.com,
  title       = {[twitter-dev] Re: Tweet Corpus creation for {NLP} research},
  url         = {http://www.mail-archive.com/twitter-development-talk@googlegroups.com/msg05715.html},
  biburl      = {https://puma.uni-kassel.de/url/1b9716d1f2674e18b3016d3ac6edc16a/benz},
  keywords    = {dataset twitter},
  added-at    = {2011-02-04T16:07:48.000+0100},
  description = {},
  interhash   = {1b9716d1f2674e18b3016d3ac6edc16a},
  intrahash   = {1b9716d1f2674e18b3016d3ac6edc16a}
}

@electronic{www.yr-bcn.es,
  title       = {Semantically Annotated Snapshot of the {English} {Wikipedia} ({SW} v.1)},
  url         = {http://www.yr-bcn.es/semanticWikipedia},
  biburl      = {https://puma.uni-kassel.de/url/a703bcf3b3890f8a4a61f052228bae8f/benz},
  keywords    = {semantics dataset wikipedia annotated ontology},
  added-at    = {2011-02-04T16:08:40.000+0100},
  description = {},
  interhash   = {a703bcf3b3890f8a4a61f052228bae8f},
  intrahash   = {a703bcf3b3890f8a4a61f052228bae8f}
}

@electronic{www.pearsonlongman.com,
  title       = {{Longman} Dictionaries - Dictionaries for Research},
  url         = {http://www.pearsonlongman.com/dictionaries/research/dict-research.html},
  biburl      = {https://puma.uni-kassel.de/url/30a773117f918e4d932e0c64e5ec6a38/benz},
  keywords    = {dataset dictionary disambiguation ldoce},
  added-at    = {2011-02-18T23:23:09.000+0100},
  description = {Pearson Longman English Language Teaching (Pearson Longman ELT) is a leading educational publisher of quality resources for all ages and abilities across the curriculum, providing solutions for teachers and students.},
  interhash   = {30a773117f918e4d932e0c64e5ec6a38},
  intrahash   = {30a773117f918e4d932e0c64e5ec6a38}
}

@electronic{pig.apache.org,
  title       = {Welcome to {Apache} {Pig}!},
  url         = {http://pig.apache.org/},
  biburl      = {https://puma.uni-kassel.de/url/a16819a4998a5d215dd1b28d7ebd6f18/hotho},
  keywords    = {analysis dataset datastore large pig},
  added-at    = {2011-03-14T18:59:41.000+0100},
  description = {},
  interhash   = {a16819a4998a5d215dd1b28d7ebd6f18},
  intrahash   = {a16819a4998a5d215dd1b28d7ebd6f18}
}

@electronic{web-ngram.research.microsoft.com,
  title       = {{Microsoft Research} - Speller Challenge Datasets},
  url         = {http://web-ngram.research.microsoft.com/spellerchallenge/DataSets.aspx},
  biburl      = {https://puma.uni-kassel.de/url/ec1f2805048b9ac374691a1774514620/benz},
  keywords    = {challenge dataset search_engine speller_challenge spelling},
  added-at    = {2011-03-16T23:23:07.000+0100},
  description = {Microsoft Research Speller Challenge},
  interhash   = {ec1f2805048b9ac374691a1774514620},
  intrahash   = {ec1f2805048b9ac374691a1774514620}
}

@electronic{an.kaist.ac.kr,
  title       = {What is {Twitter}, a Social Network or a News Media? - {WWW'10}},
  url         = {http://an.kaist.ac.kr/traces/WWW2010.html},
  biburl      = {https://puma.uni-kassel.de/url/39fbd40f2a9a8d4682162507b2a41924/hotho},
  keywords    = {dataset network social twitter},
  added-at    = {2011-03-24T10:18:26.000+0100},
  description = {},
  interhash   = {39fbd40f2a9a8d4682162507b2a41924},
  intrahash   = {39fbd40f2a9a8d4682162507b2a41924}
}

@electronic{d8taplex.com,
  title       = {d8taplex},
  url         = {http://d8taplex.com/},
  biburl      = {https://puma.uni-kassel.de/url/9eb6a8822bb92c8b8927be72ef87b847/hotho},
  keywords    = {data dataset discovery exploration visualization web},
  added-at    = {2011-05-03T10:18:57.000+0200},
  description = {d8taplex helps you discover, visualize and explore data found on the web including time series data},
  interhash   = {9eb6a8822bb92c8b8927be72ef87b847},
  intrahash   = {9eb6a8822bb92c8b8927be72ef87b847}
}

% Second bookmark on the d8taplex.com host (different url and hashes). It used
% to reuse the key "d8taplex.com", which BibTeX rejects as a repeated entry and
% drops; the ":datasets" suffix makes the key unique so this record is citable.
% The first record keeps the plain key, so existing citations are unaffected.

@electronic{d8taplex.com:datasets,
  title       = {Datasets},
  url         = {http://d8taplex.com/directory/directory.html},
  biburl      = {https://puma.uni-kassel.de/url/12f0b282945915b09de3b87be9948ab0/hotho},
  keywords    = {dataset series time},
  added-at    = {2011-05-03T10:19:39.000+0200},
  description = {},
  interhash   = {12f0b282945915b09de3b87be9948ab0},
  intrahash   = {12f0b282945915b09de3b87be9948ab0}
}

@electronic{code.richrelevance.com,
  title       = {{RecLab} Core -},
  url         = {http://code.richrelevance.com/reclab-core/},
  biburl      = {https://puma.uni-kassel.de/url/e9702e7751ffd591cca67add470d3f6b/hotho},
  keywords    = {algorithm challenge data dataset development improvement method recommender},
  added-at    = {2011-05-26T11:48:26.000+0200},
  description = {},
  interhash   = {e9702e7751ffd591cca67add470d3f6b},
  intrahash   = {e9702e7751ffd591cca67add470d3f6b}
}

@electronic{trec.nist.gov,
  title       = {{Tweets2011} {Twitter} Collection},
  url         = {http://trec.nist.gov/data/tweets/},
  biburl      = {https://puma.uni-kassel.de/url/6114f26ca8c1a62f39518e1eadc722bc/hotho},
  keywords    = {corpus dataset everyaware twitter},
  added-at    = {2011-09-02T10:41:42.000+0200},
  description = {Tweets2011 As part of the TREC 2011 microblog track, Twitter provided identifiers for approximately 16 million tweets sampled between January 23rd and February 8th, 2011. The corpus is designed to be a reusable, representative sample of the twittersphere - i.e. both important and spam tweets are included.},
  interhash   = {6114f26ca8c1a62f39518e1eadc722bc},
  intrahash   = {6114f26ca8c1a62f39518e1eadc722bc}
}

@electronic{www.prosper.com,
  title       = {Academics - {Prosper}},
  url         = {http://www.prosper.com/about/academics.aspx},
  biburl      = {https://puma.uni-kassel.de/url/32ce80d74cdbad83e6aeced721034f28/hotho},
  keywords    = {data dataset research},
  added-at    = {2011-09-05T17:04:47.000+0200},
  description = {If you are interested in doing research on Prosper or using Prosper data in support of your research, please contact us.},
  interhash   = {32ce80d74cdbad83e6aeced721034f28},
  intrahash   = {32ce80d74cdbad83e6aeced721034f28}
}

@electronic{arnetminer.org,
  title       = {Citation Network Dataset},
  url         = {http://arnetminer.org/citation},
  biburl      = {https://puma.uni-kassel.de/url/e161aac032d6db0c923066015bb6a147/stephandoerfel},
  keywords    = {arnetminer citation dataset},
  added-at    = {2011-09-15T15:22:45.000+0200},
  description = {},
  interhash   = {e161aac032d6db0c923066015bb6a147},
  intrahash   = {e161aac032d6db0c923066015bb6a147}
}

@electronic{reality.media.mit.edu,
  title       = {{MIT Media Lab}: Reality Mining},
  url         = {http://reality.media.mit.edu/},
  biburl      = {https://puma.uni-kassel.de/url/365294ebae4828f93aca9d32ab116908/hotho},
  keywords    = {data dm everyaware lab media mining reality traces dataset},
  added-at    = {2011-09-30T08:49:38.000+0200},
  description = {},
  interhash   = {365294ebae4828f93aca9d32ab116908},
  intrahash   = {365294ebae4828f93aca9d32ab116908}
}

@electronic{webscope.sandbox.yahoo.com,
  title       = {{Webscope} from {Yahoo! Labs}},
  url         = {http://webscope.sandbox.yahoo.com/catalog.php},
  biburl      = {https://puma.uni-kassel.de/url/d9da5f26b324d77524cf2bc5716c04a7/hotho},
  keywords    = {language search web dataset},
  added-at    = {2011-10-04T17:49:26.000+0200},
  description = {},
  interhash   = {d9da5f26b324d77524cf2bc5716c04a7},
  intrahash   = {d9da5f26b324d77524cf2bc5716c04a7}
}