% Conference paper (ICASSP 2009) on compressing line spectral frequency
% parameters with the Asynchronous Interpolation Model.
% The citation key looks like an export-generated identifier; it is kept
% unchanged so that existing citations keep resolving.
% NOTE(review): month/day say 23 Sep 2009, while the note field gives the
% conference dates as 19-24 Apr 2009. Presumably the former is an online
% publication or indexing date -- confirm against the publisher record.
@inproceedings{c87df12055804c1cbb0f419dc96d3751,
  author    = {Moldover, Rachel and Kain, Alexander},
  title     = {Compression of line spectral frequency parameters with asynchronous interpolation},
  booktitle = {2009 {IEEE} International Conference on Acoustics, Speech, and Signal Processing - Proceedings, {ICASSP} 2009},
  series    = {{ICASSP}, {IEEE} International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {3789--3792},
  year      = {2009},
  month     = sep,
  day       = {23},
  doi       = {10.1109/ICASSP.2009.4960452},
  isbn      = {9781424423545},
  language  = {English (US)},
  keywords  = {Acoustic inventory, Compression, Speech synthesis, TTS, Temporal decomposition},
  abstract  = {TTS systems require a trade-off between size and speech quality. A larger acoustic inventory allows synthesis of speech that sounds more natural. The Asynchronous Interpolation Model improves the quality to size ratio, allowing better compression of large acoustic inventories, as well as better quality speech from a small system. At maximum compression, our method represents most phonemes by a single frame of data. Coarticulation effects are specified as context-specific non-linear interpolation functions. Dividing the speech features into multiple data streams allows asynchronous interpolation. In this study, AIM was applied to LSF parameters. Varying the number of streams allows for variable amount of compression. We used three different objective measures to investigate the effect of number and partitioning of streams. The first few weight functions (and the last one) seem to offer the most error reduction. Partitions separating the first 6 LSFs score well with all three measures.},
  note      = {2009 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2009 ; Conference date: 19-04-2009 Through 24-04-2009},
}