% Noll, Schwab, Wiryadi (2004): paper in the ESSV 2004 proceedings volume.
% Names are in "Last, First" form; publisher and its city are separate fields.
@InProceedings{Noll2004_498,
  author    = {Noll, Peter and Schwab, Markus and Wiryadi, Wilbert},
  title     = {Sensing People -- Localization with Microphone Arrays},
  booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2004},
  editor    = {Fellbaum, Klaus},
  year      = {2004},
  month     = mar,
  pages     = {11--18},
  publisher = {TUDpress},
  address   = {Dresden},
  abstract  = {In this paper we present a real-time microphone array system which performs 3D
source localization, multi channel speech enhancement and robust speech recognition.
The acoustic source localization uses the SRP-PHAT method [1] to produce
potential source locations. A clustering algorithm excludes outliers and enables
a multi source tracking. The localizations are finally optimally filtered with an
appropriate Kalman filter. The proposed speech enhancement, a weighted subarray
Delay-and-Sum beamformer, is designed to cope with the problem of diffuse
noise and changing speaker positions subject to minimization of the word error rate
(WER) of an automatic speech recognition system (ASR). The proposed algorithm
reduces the WER by more than 50\,\% compared to the WER of a single microphone
signal.},
  isbn      = {978-3-937672-65-6},
  issn      = {0940-6832},
  keywords  = {Mobile Computing, Ubiquitous Computing und Ambient Intelligence (Hauptvorträge)},
  url       = {https://www.essv.de/pdf/2004_11_18.pdf},
}