% ESSV 2024 conference paper. The citation key is kept unchanged (including its
% non-ASCII character) so that existing citations of this entry keep resolving.
@InProceedings{Höge2024_1207,
  author    = {Höge, Harald},
  title     = {The Use of Temporal Features in Cortical Segmentation of Syllables},
  booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2024},
  editor    = {Baumann, Timo},
  year      = {2024},
  month     = mar,
  pages     = {70--77},
  publisher = {TUDpress},
  address   = {Dresden},
  isbn      = {978-3-95908-325-6},
  issn      = {0940-6832},
  doi       = {10.35096/othr/pub-7082},
  url       = {https://www.essv.de/pdf/2024_70_77.pdf},
  keywords  = {Phonetische Untersuchungen},
  abstract  = {There is high confidence for the hypothesis that in speech perception the cycles of a θ-oscillation segment the auditory signal into syllables [8]. Yet the functionality of the oscillator generating the θ-oscillation is unknown. We follow the finding that, within an auditory scene, speech is perceived as a stream given by temporal coherence [12]. We work with the hypotheses that the θ-oscillator is driven by temporal features providing this coherence. We propose a new temporal feature called O-distance, which detects the onset of a syllable – the starting point $t_o$ of a θ-cycle – triggered by the temporal distance from $t_o$ to the instance of the maximal rise of the loudness curve of the vowel. To extract $t_o$ from the auditory signal, we use the statistical properties of this distance based on the C-center hypothesis [25], which predicts a close temporal relation of the onset consonants to the onset of a vowel. The statistics are derived from reference O-distance extracted from an articulatory database, where the minima and maxima of the loudness are related to maxima and minima of the lower incisor and tongue tip. To judge the quality of the O-distance extracted from the auditory signal, we regard the temporal deviation of the O-distance to the reference O-distance. Currently we achieve a mean deviation of 34ms.},
}