% Bibliography entries for corpus-related references.
%
% Maintainer notes (plain text outside entries is ignored by BibTeX and Biber):
%   * Fields with no value are omitted rather than written as empty braces,
%     so that tools do not report empty-field warnings.
%   * The non-standard "const" field is carried verbatim on every entry.
%     Standard styles ignore unknown fields; its consumer is not visible from
%     this file, so the value is left untouched.
%   * Acronyms and proper nouns in titles are brace-protected so that
%     sentence-casing styles do not lowercase them.

% The key says 2005 but the article was published in 2006; the key is kept
% unchanged so that existing citations continue to resolve.
% NOTE(review): volume, number and pages were added from the published
% citation -- confirm against the publisher record.
@article{wikipediaxml:2005,
  author  = {Denoyer, Ludovic and Gallinari, Patrick},
  title   = {The {Wikipedia} {XML} Corpus},
  journal = {SIGIR Forum},
  volume  = {40},
  number  = {1},
  pages   = {64--69},
  year    = {2006},
  url     = {http://www-connex.lip6.fr/~denoyer/wikipediaXML/},
  const   = {\ text},
}

% CoRR is the arXiv Computing Research Repository; the eprint fields carry the
% arXiv identifier for styles that support them (others ignore them).
% NOTE(review): confirm the eprint identifier against arXiv.
@article{jiang97semantic,
  author     = {Jiang, Jay J. and Conrath, David W.},
  title      = {Semantic Similarity Based on Corpus Statistics and Lexical Taxonomy},
  journal    = {CoRR},
  eprint     = {cmp-lg/9709008},
  eprinttype = {arXiv},
  year       = {1997},
  const      = {\ text},
}

% "Apr" is the publication month, not an issue number, so it is stored with the
% predefined month macro. The volume matches the "volume5" path in the URL.
% NOTE(review): the page range was added from the published citation -- confirm.
% Given names are only available here as initials.
@article{Lew04,
  author  = {Lewis, D. D. and Yang, Y. and Rose, T. G. and Li, F.},
  title   = {{RCV1}: A New Benchmark Collection for Text Categorization Research},
  journal = {Journal of Machine Learning Research},
  volume  = {5},
  month   = apr,
  pages   = {361--397},
  year    = {2004},
  url     = {http://www.jmlr.org/papers/volume5/lewis04a/lewis04a.pdf},
  const   = {\ text},
}

% The booktitle field is required for this entry type.
% NOTE(review): the venue is believed to be IJCAI 2003 -- confirm against the
% proceedings record and add pages once verified.
@inproceedings{halevymadhavan2003,
  author    = {Halevy, Alon Y. and Madhavan, Jayant},
  title     = {Corpus-Based Knowledge Representation},
  booktitle = {Proceedings of the 18th International Joint Conference on Artificial Intelligence ({IJCAI})},
  year      = {2003},
  const     = {\ text},
}