@MASTERSTHESIS\{IMM2003-02551, author = "D. J. Jacobsen", title = "Probabilistic Speech Detection", year = "2003", keywords = "machine learning, classification, voice activity detection, linear networks, independent component analysis, receiver operating characteristics", school = "Informatics and Mathematical Modelling, Technical University of Denmark, {DTU}", address = "Richard Petersens Plads, Building 321, {DK-}2800 Kgs. Lyngby", type = "", note = "Supervisor: Jan Larsen", url = "http://www2.compute.dtu.dk/pubdb/pubs/2551-full.html", abstract = "This thesis deals with the detection of speech in signals that may contain very different noise types, referred to as the 'Voice Activity Detection' (VAD) problem. The signals consist of sections of noise only and sections of speech and noise in an additive mixture; convolutive mixtures are not addressed. Two different probabilistic methods are developed to solve the {VAD} problem. One is a discriminant-function based method in which a linear network with a single logistic output is trained to output the probability of speech presence from a given sound signal. The other is based on modelling of class-conditional probability densities, using Independent Component Analysis (ICA) methods. The algorithms are tested extensively and comparisons are made between them. They are also compared to an industry standard {VAD} algorithm, namely that of the the {ITU-T} G.729B recommendation and one other {VAD}. The results show the crucial importance of considering the type of noise present with the speech for obtaining robust speech detection and that for certain noise types, performance can be bettered with the developed {VAD} algorithms." }