@InProceedings{Evin2010_564,
author = {Diego Evin and Jorge Gurlekian and Humberto Torres},
booktitle = {Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2010},
title = {N-Best Rescoring based on Intonation Prediction for a Spanish ASR System},
year = {2010},
editor = {Hansjörg Mixdorff},
month = mar,
pages = {234--233},
publisher = {TUDpress, Dresden},
abstract = {This paper presents a novel method for rescoring the n-best recognition
hypotheses using intonation knowledge. The model synthesizes the f0 contours for
each of the n-best hypotheses and estimates an intonative matching index between
the synthetic shapes and the real f0 contour. This index is applied in the rescoring
process, and can be viewed as a degree of intonation compatibility between the
hypotheses and the input sentence. The f0 prediction is based on classification and
regression trees and the Fujisaki model. We evaluate our approach using a single
speaker of the Buenos Aires Spanish LIS-SECYT database under clean and babblenoisy
conditions. Considering the systems under no grammar condition, the proposed
model reduces the mean absolute word error rate in 3.1% with respect to the baseline
system, in a consistent manner and under different noise conditions.},
isbn = {978-3-941298-85-9},
issn = {0940-6832},
keywords = {Speech Recognition},
url = {https://www.essv.de/pdf/2010_234_233.pdf},
}