@InProceedings{Elmers2022_1160,
author = {Mikey Elmers},
booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2022},
title = {Comparing detection methods for pause-internal particles},
year = {2022},
editor = {Oliver Niebuhr and Malin Svensson Lundmark and Heather Weston},
month = mar,
pages = {204--211},
publisher = {TUDpress, Dresden},
abstract = {This study investigates different machine learning architectures for classifying
pause-internal phonetic particles (PINTs), such as filler particles (FPs),
breath noises complementary to silences, and tongue clicks. Many of these PINTs
co-occur, and by modeling them simultaneously, the aim is to improve the classification
accuracy for the surrounding PINTs as well. An annotated subset from a
German spontaneous speech corpus was used for modeling. Mel-frequency cepstral
coefficients were used as inputs to model PINTs with three kinds of neural
networks: a general neural network, a convolutional neural network, and a recurrent
neural network. The models used the same hyperparameters, number of layers,
and number of neurons for those layers, so that the focus was put onto the model
architecture. The recurrent neural network was expected to perform the best since
it is able to capture temporal information; however, all models performed similarly.
The models performed best at classifying silent segments, followed by inhalations
and exhalations. However, all models failed to accurately classify FPs and clicks,
indicating that modeling PINTs simultaneously doesn’t always improve accuracy
for surrounding PINTs. These findings suggest that accurate classification is more
dependent on annotation quantity and quality than model architecture. The main
contributions of this paper are the classification of multiple PINTs simultaneously,
and the improvement of PINTs classification for the German language.},
isbn = {978-3-95908-548-9},
issn = {0940-6832},
keywords = {Signal Processing & Comprehension},
url = {https://www.essv.de/pdf/2022_204_211.pdf},
}