% Conference paper from the ICASSP 2011 proceedings (see booktitle/note below).
% Authors use the unambiguous "Last, First" form; the percent sign in the
% abstract is escaped so styles that typeset the abstract do not read it as
% the start of a TeX comment.
@inproceedings{611087d4aa714a5cb78658e94095496a,
title = "{F0} range and peak alignment across speakers and emotions",
abstract = "We present an analysis of F0 range and peak alignment in emotional speech from a heterogeneous group of speakers varying in age and gender. Both speaker and emotion had a strong effect on F0 range. Despite these large changes in the F0 trajectory, peak alignment was remarkably stable. Using the Linear Alignment Model (LAM) [1], we show that the effects on alignment of emotion and speaker differences, although statistically significant, are small. This stability results in a conclusion that peak alignment, unlike F0 range, does not appear to carry much information about speaker identity or emotional state. The LAM is effective in that it explains 42\% of the variance in peak location on average, and furthermore it predicts the time of F0 peaks with an average RMS error of 12ms.",
keywords = "emotion recognition, human voice, speech analysis, speech synthesis",
author = "Morley, Eric and {Van Santen}, Jan and Klabbers, Esther and Kain, Alexander",
year = "2011",
doi = "10.1109/ICASSP.2011.5947467",
language = "English (US)",
isbn = "9781457705397",
series = "ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings",
pages = "4952--4955",
booktitle = "2011 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2011 - Proceedings",
note = "36th IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2011 ; Conference date: 22-05-2011 Through 27-05-2011",
}