@inproceedings{journals/jmlr/ChangB09, author = {Chang, Jonathan and Blei, David M.}, booktitle = {AISTATS}, crossref = {conf/aistats/2009}, editor = {Dyk, David A. Van and Welling, Max}, ee = {http://www.jmlr.org/proceedings/papers/v5/chang09a.html}, interhash = {f3431fd69b315a22422a2c0f15ee0b71}, intrahash = {86f665b74ecabb56e81542e0f052a331}, pages = {81-88}, publisher = {JMLR.org}, series = {JMLR Proceedings}, title = {Relational Topic Models for Document Networks.}, url = {http://dblp.uni-trier.de/db/journals/jmlr/jmlrp5.html#ChangB09}, volume = 5, year = 2009 } @inproceedings{chang2009reading, abstract = {Probabilistic topic models are a popular tool for the unsupervised analysis of text, providing both a predictive model of future text and a latent topic representation of the corpus. Practitioners typically assume that the latent space is semantically meaningful. It is used to check models, summarize the corpus, and guide exploration of its contents. However, whether the latent space is interpretable is in need of quantitative evaluation. In this paper, we present new quantitative methods for measuring semantic meaning in inferred topics. We back these measures with large-scale user studies, showing that they capture aspects of the model that are undetected by previous measures of model quality based on held-out likelihood. Surprisingly, topic models which perform better on held-out likelihood may infer less semantically meaningful topics.}, author = {Chang, Jonathan and Boyd-Graber, Jordan L. and Gerrish, Sean and Wang, Chong and Blei, David M.}, booktitle = {NIPS}, editor = {Bengio, Yoshua and Schuurmans, Dale and Lafferty, John D. and Williams, Christopher K. I. and Culotta, Aron}, interhash = {48210cee941ee21e6282798e28270a6d}, intrahash = {cd4cf8ff8a676ca7bbc4201ddbc2d024}, isbn = {9781615679119}, pages = {288--296}, publisher = {Curran Associates, Inc.}, title = {Reading Tea Leaves: How Humans Interpret Topic Models}, url = {http://books.nips.cc/papers/files/nips22/NIPS2009_0125.pdf}, year = 2009 } @incollection{griffiths_05, address = {Cambridge, MA}, author = {{Griffiths}, Thomas L. and {Steyvers}, Mark and {Blei}, David M. and {Tenenbaum}, Joshua B.}, booktitle = {Advances in Neural Information Processing Systems 17}, editor = {Saul, Lawrence K. and Weiss, Yair and Bottou, {L\'{e}on}}, interhash = {7d2594aa4b9905370ef001eebb6461b7}, intrahash = {dd89145403b46fc5315d3206f89bb09b}, owner = {heinrich}, pages = {537-544}, publisher = {MIT Press}, title = {Integrating Topics and Syntax}, volume = 17, year = 2005 } @article{Blei+Ng+Jordan:03a, author = {Blei, David M. and Ng, Andrew Y. and Jordan, Michael I.}, interhash = {9d1b808272b9e511425cbf557571e59a}, intrahash = {cbccc8032ce2763326dbe5de19c58aaf}, journal = {Journal of Machine Learning Research}, pages = {993--1022}, title = {Latent {Dirichlet} Allocation}, volume = 3, year = 2003 }