% Conference paper by Harald Höge in the proceedings volume
% "Elektronische Sprachsignalverarbeitung 2024" (pp. 70--77).
% The citation key is kept unchanged so existing \cite commands still resolve;
% because it is non-ASCII it needs a UTF-8-aware backend (e.g. Biber).
% NOTE(review): "$t_o$" and "O-distance" in the abstract repair characters that
% appear to have been lost in text extraction -- confirm against the PDF.
@InProceedings{Höge2024_1207,
  author    = {Höge, Harald},
  title     = {The Use of Temporal Features in Cortical Segmentation of Syllables},
  booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2024},
  editor    = {Baumann, Timo},
  year      = {2024},
  month     = mar,
  pages     = {70--77},
  publisher = {TUDpress},
  address   = {Dresden},
  abstract  = {There is high confidence for the hypothesis that in speech perception the
cycles of a θ-oscillation segment the auditory signal into syllables [8]. Yet the functionality
of the oscillator generating the θ-oscillation is unknown. We follow the finding
that, within an auditory scene, speech is perceived as a stream given by temporal
coherence [12]. We work with the hypotheses that the θ-oscillator is driven by temporal
features providing this coherence. We propose a new temporal feature called O-distance,
which detects the onset of a syllable - the starting point $t_o$ of a θ-cycle –
triggered by the temporal distance from $t_o$ to the instance of the maximal rise of the
loudness curve of the vowel. To extract $t_o$ from the auditory signal, we use the statistical
properties of this distance based on the C-center hypothesis [25], which predicts
a close temporal relation of the onset consonants to the onset of a vowel. The statistics
are derived from reference O-distance extracted from an articulatory database, where
the minima and maxima of the loudness are related to maxima and minima of the lower
incisor and tongue tip. To judge the quality of the O-distance extracted from the auditory
signal, we regard the temporal deviation of the O-distance to the reference O-distance.
Currently we achieve a mean deviation of 34ms.},
  isbn      = {978-3-95908-325-6},
  issn      = {0940-6832},
  keywords  = {Phonetische Untersuchungen},
  url       = {https://www.essv.de/pdf/2024_70_77.pdf},
  doi       = {10.35096/othr/pub-7082},
}