% Conference paper in the ESSV 2021 proceedings volume (TUDpress).
% Names are stored in "Last, First" form; the publisher's city lives in
% the address field; the acronym in the title is brace-protected so that
% sentence-casing styles keep it upper-case.
% NOTE(review): the second author's surname is recorded as "Mcglashan";
% confirm the capitalisation against the published paper.
@InProceedings{Howard2021_1115,
  author    = {Howard, Ian S. and Mcglashan, Julian and Fourcin, Adrian J.},
  title     = {Machine Learning analysis of speech and {EGG} for the diagnosis of voice pathology},
  booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2021},
  editor    = {Hillmann, Stefan and Weiss, Benjamin and Michael, Thilo and M{\"o}ller, Sebastian},
  year      = {2021},
  month     = mar,
  pages     = {169--176},
  publisher = {TUDpress},
  address   = {Dresden},
  isbn      = {978-3-95908-227-3},
  issn      = {0940-6832},
  url       = {https://www.essv.de/pdf/2021_169_176.pdf},
  keywords  = {Phonetik und Artikulation},
  abstract  = {Current approaches to voice diagnosis involve a clinician examining the patient, listening to their voice and in some cases, using additional measurements of the larynx such as EGG. Here we train a feedforward convolutional neural network on a database of normal healthy drama students recorded speaking passages in English, to reconstruct the associated EGG (Lx) waveform. We then use the network to predict the EGG from the acoustic speech signal on a different set of speakers, including ones that exhibit laryngeal pathologies. We show the predicted EGG is very similar to the actual recorded EGG and, as such, can provide a useful indication of voice pathology. Importantly, the network is able predict the pathological EGG waveforms even though it was never trained on pathological speech.},
}