We consider problems involving groups of data, where each observation within a group is
a draw from a mixture model, and where it is desirable to share mixture components between
groups. We assume that the number of mixture components is unknown a priori and is to be
inferred from the data. In this setting it is natural to consider sets of Dirichlet processes, one
for each group, where the well-known clustering property of the Dirichlet process provides a
nonparametric prior for the number of mixture components within each group. Given our desire
to tie the mixture models in the various groups, we consider a hierarchical model, specifically
one in which the base measure for the child Dirichlet processes is itself distributed according to
a Dirichlet process. Such a base measure being discrete, the child Dirichlet processes necessar-
ily share atoms. Thus, as desired, the mixture models in the different groups necessarily share
mixture components. We discuss representations of hierarchical Dirichlet processes in terms of
a stick-breaking process, and a generalization of the Chinese restaurant process that we refer
to as the “Chinese restaurant franchise.” We present Markov chain Monte Carlo algorithms
for posterior inference in hierarchical Dirichlet process mixtures, and describe applications to
problems in information retrieval and text modelling.
%0 Journal Article
%1 teh2006hdp
%A Teh, Y.W.
%A Jordan, M.I.
%A Beal, M.J.
%A Blei, D.M.
%D 2006
%I ASA AMERICAN STATISTICAL ASSOCIATION
%J JOURNAL-AMERICAN STATISTICAL ASSOCIATION
%K hierarchy imported machinelearning model topic
%N 476
%P 1566
%T Hierarchical Dirichlet Processes
%U http://oz.berkeley.edu/tech-reports/653.pdf
%V 101
%X We consider problems involving groups of data, where each observation within a group is
a draw from a mixture model, and where it is desirable to share mixture components between
groups. We assume that the number of mixture components is unknown a priori and is to be
inferred from the data. In this setting it is natural to consider sets of Dirichlet processes, one
for each group, where the well-known clustering property of the Dirichlet process provides a
nonparametric prior for the number of mixture components within each group. Given our desire
to tie the mixture models in the various groups, we consider a hierarchical model, specifically
one in which the base measure for the child Dirichlet processes is itself distributed according to
a Dirichlet process. Such a base measure being discrete, the child Dirichlet processes necessar-
ily share atoms. Thus, as desired, the mixture models in the different groups necessarily share
mixture components. We discuss representations of hierarchical Dirichlet processes in terms of
a stick-breaking process, and a generalization of the Chinese restaurant process that we refer
to as the “Chinese restaurant franchise.” We present Markov chain Monte Carlo algorithms
for posterior inference in hierarchical Dirichlet process mixtures, and describe applications to
problems in information retrieval and text modelling.
@article{teh2006hdp,
abstract = {We consider problems involving groups of data, where each observation within a group is
a draw from a mixture model, and where it is desirable to share mixture components between
groups. We assume that the number of mixture components is unknown a priori and is to be
inferred from the data. In this setting it is natural to consider sets of Dirichlet processes, one
for each group, where the well-known clustering property of the Dirichlet process provides a
nonparametric prior for the number of mixture components within each group. Given our desire
to tie the mixture models in the various groups, we consider a hierarchical model, specifically
one in which the base measure for the child Dirichlet processes is itself distributed according to
a Dirichlet process. Such a base measure being discrete, the child Dirichlet processes necessar-
ily share atoms. Thus, as desired, the mixture models in the different groups necessarily share
mixture components. We discuss representations of hierarchical Dirichlet processes in terms of
a stick-breaking process, and a generalization of the Chinese restaurant process that we refer
to as the “Chinese restaurant franchise.” We present Markov chain Monte Carlo algorithms
for posterior inference in hierarchical Dirichlet process mixtures, and describe applications to
problems in information retrieval and text modelling.},
added-at = {2008-09-09T06:54:05.000+0200},
author = {Teh, Y.W. and Jordan, M.I. and Beal, M.J. and Blei, D.M.},
biburl = {https://www.bibsonomy.org/bibtex/217b5747d496dba6a19e03d5610d9fe2a/tberg},
interhash = {34e30f6d1538ed136344f6a9cf8a791b},
intrahash = {17b5747d496dba6a19e03d5610d9fe2a},
journal = {JOURNAL-AMERICAN STATISTICAL ASSOCIATION},
keywords = {hierarchy imported machinelearning model topic},
number = 476,
pages = 1566,
publisher = {ASA AMERICAN STATISTICAL ASSOCIATION},
timestamp = {2008-09-09T06:54:05.000+0200},
title = {{Hierarchical Dirichlet Processes}},
url = {http://oz.berkeley.edu/tech-reports/653.pdf},
volume = 101,
year = 2006
}