A Practical Algorithm for Topic Modeling with Provable Guarantees. Arora, S., Ge, R., Halpern, Y., Mimno, D. M., Moitra, A., Sontag, D., Wu, Y., & Zhu, M. In Proceedings of the International Conference on Machine Learning (ICML), volume 28 (2), pages 280–288, 2013. JMLR: W&CP.
Paper abstract bibtex Topic models provide a useful method for dimensionality reduction and exploratory data analysis in large text corpora. Most approaches to topic model learning have been based on a maximum likelihood objective. Efficient algorithms exist that attempt to approximate this objective, but they have no provable guarantees. Recently, algorithms have been introduced that provide provable bounds, but these algorithms are not practical because they are inefficient and not robust to violations of model assumptions. In this paper we present an algorithm for learning topic models that is both provable and practical. The algorithm produces results comparable to the best MCMC implementations while running orders of magnitude faster.
@inproceedings{AroraEtAl_icml13,
author = {Sanjeev Arora and Rong Ge and Yoni Halpern and David M. Mimno and Ankur Moitra and David Sontag and Yichen Wu and Michael Zhu},
title = {A Practical Algorithm for Topic Modeling with Provable Guarantees},
booktitle = {Proceedings of the International Conference on Machine Learning (ICML)},
year = {2013},
publisher = {JMLR: W\&CP},
volume = {28 (2)},
pages = {280--288},
keywords = {Machine learning, Unsupervised learning, Topic models},
url_Paper = {http://people.csail.mit.edu/dsontag/papers/AroraEtAl_icml13.pdf},
abstract = {Topic models provide a useful method for dimensionality reduction and exploratory data analysis in large text corpora. Most approaches to topic model learning have been based on a maximum likelihood objective. Efficient algorithms exist that attempt to approximate this objective, but they have no provable guarantees. Recently, algorithms have been introduced that provide provable bounds, but these algorithms are not practical because they are inefficient and not robust to violations of model assumptions. In this paper we present an algorithm for learning topic models that is both provable and practical. The algorithm produces results comparable to the best MCMC implementations while running orders of magnitude faster.}
}
Downloads: 0
{"_id":"v6f3ApoM5hYgzxqKS","bibbaseid":"arora-ge-halpern-mimno-moitra-sontag-wu-zhu-apracticalalgorithmfortopicmodelingwithprovableguarantees-2013","author_short":["Arora, S.","Ge, R.","Halpern, Y.","Mimno, D. M.","Moitra, A.","Sontag, D.","Wu, Y.","Zhu, M."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Sanjeev"],"propositions":[],"lastnames":["Arora"],"suffixes":[]},{"firstnames":["Rong"],"propositions":[],"lastnames":["Ge"],"suffixes":[]},{"firstnames":["Yoni"],"propositions":[],"lastnames":["Halpern"],"suffixes":[]},{"firstnames":["David","M."],"propositions":[],"lastnames":["Mimno"],"suffixes":[]},{"firstnames":["Ankur"],"propositions":[],"lastnames":["Moitra"],"suffixes":[]},{"firstnames":["David"],"propositions":[],"lastnames":["Sontag"],"suffixes":[]},{"firstnames":["Yichen"],"propositions":[],"lastnames":["Wu"],"suffixes":[]},{"firstnames":["Michael"],"propositions":[],"lastnames":["Zhu"],"suffixes":[]}],"title":"A Practical Algorithm for Topic Modeling with Provable Guarantees","booktitle":"Proceedings of the International Conference on Machine Learning (ICML)","year":"2013","publisher":"JMLR: W&CP","volume":"28 (2)","pages":"280–288","keywords":"Machine learning, Unsupervised learning, Topic models","url_paper":"http://people.csail.mit.edu/dsontag/papers/AroraEtAl_icml13.pdf","abstract":"Topic models provide a useful method for dimensionality reduction and exploratory data analysis in large text corpora. Most approaches to topic model learning have been based on a maximum likelihood objective. Efficient algorithms exist that attempt to approximate this objective, but they have no provable guarantees. Recently, algorithms have been introduced that provide provable bounds, but these algorithms are not practical because they are inefficient and not robust to violations of model assumptions. In this paper we present an algorithm for learning topic models that is both provable and practical. The algorithm produces results comparable to the best MCMC implementations while running orders of magnitude faster.","bibtex":"@inproceedings{AroraEtAl_icml13,\n author = {Sanjeev Arora and Rong Ge and Yoni Halpern and David M. Mimno and Ankur Moitra and David Sontag and Yichen Wu and Michael Zhu},\n title = {A Practical Algorithm for Topic Modeling with Provable Guarantees},\n booktitle = {Proceedings of the International Conference on Machine Learning (ICML)},\n year = {2013},\n publisher = {JMLR: W\\&CP},\n volume = {28 (2)},\n pages = {280--288},\n keywords = {Machine learning, Unsupervised learning, Topic models},\n url_Paper = {http://people.csail.mit.edu/dsontag/papers/AroraEtAl_icml13.pdf},\n abstract = {Topic models provide a useful method for dimensionality reduction and exploratory data analysis in large text corpora. Most approaches to topic model learning have been based on a maximum likelihood objective. Efficient algorithms exist that attempt to approximate this objective, but they have no provable guarantees. Recently, algorithms have been introduced that provide provable bounds, but these algorithms are not practical because they are inefficient and not robust to violations of model assumptions. In this paper we present an algorithm for learning topic models that is both provable and practical. The algorithm produces results comparable to the best MCMC implementations while running orders of magnitude faster.}\n}\n\n","author_short":["Arora, S.","Ge, R.","Halpern, Y.","Mimno, D. M.","Moitra, A.","Sontag, D.","Wu, Y.","Zhu, M."],"key":"AroraEtAl_icml13","id":"AroraEtAl_icml13","bibbaseid":"arora-ge-halpern-mimno-moitra-sontag-wu-zhu-apracticalalgorithmfortopicmodelingwithprovableguarantees-2013","role":"author","urls":{" paper":"http://people.csail.mit.edu/dsontag/papers/AroraEtAl_icml13.pdf"},"keyword":["Machine learning","Unsupervised learning","Topic models"],"metadata":{"authorlinks":{}},"html":""},"bibtype":"inproceedings","biburl":"http://people.csail.mit.edu/dsontag/papers/bibtex/david_sontag_papers_all.bib","dataSources":["6sSgqzaHAPRWvSxTP","g3ofqhxNQWsRWkCrp"],"keywords":["machine learning","unsupervised learning","topic models"],"search_terms":["practical","algorithm","topic","modeling","provable","guarantees","arora","ge","halpern","mimno","moitra","sontag","wu","zhu"],"title":"A Practical Algorithm for Topic Modeling with Provable Guarantees","year":2013}