In *Proceedings of the 25th International Conference on Machine Learning*, of *ICML '08*, pages 872--879, New York, NY, USA, 2008. ACM.

Paper doi abstract bibtex

Paper doi abstract bibtex

Deep Belief Networks (DBN's) are generative models that contain many layers of hidden variables. Efficient greedy algorithms for learning and approximate inference have allowed these models to be applied successfully in many application domains. The main building block of a DBN is a bipartite undirected graphical model called a restricted Boltzmann machine (RBM). Due to the presence of the partition function, model selection, complexity control, and exact maximum likelihood learning in RBM's are intractable. We show that Annealed Importance Sampling (AIS) can be used to efficiently estimate the partition function of an RBM, and we present a novel AIS scheme for comparing RBM's with different architectures. We further show how an AIS estimator, along with approximate inference, can be used to estimate a lower bound on the log-probability that a DBN model with multiple hidden layers assigns to the test data. This is, to our knowledge, the first step towards obtaining quantitative results that would allow us to directly assess the performance of Deep Belief Networks as generative models of data.

% Fixed: garbled urldate ({2015-05-03TZ} -> ISO {2015-05-03}); dropped the
% scraped citation-count field (note = {00129}), which is not bibliographic
% data; removed stray space in the citation key; one field per line.
@inproceedings{salakhutdinov_quantitative_2008,
  author    = {Salakhutdinov, Ruslan and Murray, Iain},
  title     = {On the {Quantitative} {Analysis} of {Deep} {Belief} {Networks}},
  booktitle = {Proceedings of the 25th {International} {Conference} on {Machine} {Learning}},
  series    = {{ICML} '08},
  pages     = {872--879},
  year      = {2008},
  address   = {New York, NY, USA},
  publisher = {ACM},
  isbn      = {978-1-60558-205-4},
  doi       = {10.1145/1390156.1390266},
  url       = {http://doi.acm.org/10.1145/1390156.1390266},
  urldate   = {2015-05-03},
  abstract  = {Deep Belief Networks (DBN's) are generative models that contain many layers of hidden variables. Efficient greedy algorithms for learning and approximate inference have allowed these models to be applied successfully in many application domains. The main building block of a DBN is a bipartite undirected graphical model called a restricted Boltzmann machine (RBM). Due to the presence of the partition function, model selection, complexity control, and exact maximum likelihood learning in RBM's are intractable. We show that Annealed Importance Sampling (AIS) can be used to efficiently estimate the partition function of an RBM, and we present a novel AIS scheme for comparing RBM's with different architectures. We further show how an AIS estimator, along with approximate inference, can be used to estimate a lower bound on the log-probability that a DBN model with multiple hidden layers assigns to the test data. This is, to our knowledge, the first step towards obtaining quantitative results that would allow us to directly assess the performance of Deep Belief Networks as generative models of data.},
}

Downloads: 0