@MISC\{IMM2013-06611, author = "P. P. Henningsen", title = "Application of machine learning in analysis of answers to open-ended questions in survey data", year = "2013", publisher = "Technical University of Denmark, {DTU} Compute, {E-}mail: compute@compute.dtu.dk", address = "Matematiktorvet, Building 303{-B,} {DK-}2800 Kgs. Lyngby, Denmark", url = "http://www.compute.dtu.dk/English.aspx", abstract = "The goal of the thesis is to implement a framework for analyzing answers to open-ended questions in a semi-automated way, thereby lessening the cost of including open-ended questions in a survey. To do this, techniques from the machine learning branch of computer science will be explored. More specifically, a methods known as latent semantic analysis and non-negative matrix factorization will be the focus of the thesis. This techniques will be used to extract topics from the answers, which enables me to cluster the answers according to these topics. The clustering will be done using k-means clustering. To implement all of this, the Python programming language is used." }