% Technical report by R. E. Madsen (December 2005) on an exponential-family
% approximation of the Dirichlet compound multinomial (DCM).
% NOTE(review): techreport entries require an `institution`; the original
% record left it (and number, series, address, type) empty, so those blank
% fields were dropped. The key prefix "IMM" and the compute.dtu.dk host suggest
% a Technical University of Denmark department -- TODO confirm and add it.
@techreport{IMM2005-04340,
  author   = {Madsen, R. E.},
  title    = {Approximating the {DCM}},
  year     = {2005},
  month    = dec,
  keywords = {dirichlet approximation {DCM}},
  url      = {http://www2.compute.dtu.dk/pubdb/pubs/4340-full.html},
  abstract = {The Dirichlet compound multinomial (DCM), which has recently been shown to be well suited for modeling for word burstiness in documents, is here investigated. A number of conceptual explanations that account for these recent results, are provided. An exponential family approximation of the {DCM} that is substantially faster to train, while still producing similar probabilities and classification performance is provided.},
}