@InProceedings{Hussain2014_206,
author = {Hussain, Zaheer},
booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2014},
title = {Significance of rhythmic duration patterns in {German} read corpus using cluster analysis},
year = {2014},
editor = {Hoffmann, R{\"u}diger},
month = mar,
pages = {217--224},
publisher = {TUDpress},
address = {Dresden},
abstract = {Synthesis of natural sounding speech is the greatest challenge in a Text-to-Speech Synthesis (TTS) system. In natural speech, duration, intensity and pitch are dynamically varied which is manifested as rhythm or prosody of speech. If these variations are not recreated, the synthesized speech will sound robotic. Synthesis of good quality speech depends on how well the duration and intonation patterns are imposed on speech segments. The best way to improve naturalness in speech is to mimic the way human brain imposes rhythm. We speak in a particular style by varying the duration of the speech segments in words and phrases as per certain specific duration patterns. Brain might be retrieving the corresponding patterns at the time of speaking for generating a discourse in a particular style such as news reading, bible reading, story telling etc. The main objective of this work is to investigate the existence of rhythmic duration patterns in natural speech using cluster analysis. Speech uttered in German language was taken for analysis. Cluster analysis was done on isolated words in continuous German read speech. Results of cluster analysis when investigated using silhouette plot showed the existence of rhythmic duration patterns in German read speech. The result is evidence to the existence of finite number of clusters of duration patterns in natural German read speech.},
isbn = {978-3-944331-51-5},
issn = {0940-6832},
keywords = {Prosodie und Emotion},
url = {https://www.essv.de/pdf/2014_217_224.pdf},
}