Statistical analysis of filled pauses' rhythm for disfluent speech synthesis. Adell, J., Bonafonte, A., & Escudero, D. In SSW6-2007. Proceedings of the Sixth ISCA Tutorial and Research Workshop in Speech Synthesis, pages 223–227, 2007. Paper abstract bibtex Given that state-of-the-art speech synthesis systems have already reached a high naturalness level, it is time to move to talking speech from the actual read speech framework. For this purpose it is thus necessary to investigate how disfluencies can be included in speech synthesis and even increase its naturalness. This paper builds on a previously presented work and focuses on finding a local model of filled pauses rhythm. A statistical study of rhythm effects around filled pauses is presented and, based on the correlation between rhythm variables, a regression model is proposed to predict filled pauses duration and prepausal lengthening.
@inproceedings{adell_statistical_2007,
Author = {Adell, Jordi and Bonafonte, Antonio and Escudero, David},
Booktitle = {SSW6-2007. Proceedings of the Sixth ISCA Tutorial and Research Workshop in Speech Synthesis},
Date = {2007},
Date-Modified = {2018-05-13 21:46:40 +0000},
Eventdate = {2007-08-22/2007-08-24},
Keywords = {disfluencies, duration, filled pauses, pause duration, pause location, pauses, phonetics, prosody, read speech, rhythm, segmental lengthening, Spanish, speaking styles, speech synthesis, speech technology, temporal factors, text-to-speech},
Location = {Bonn, Germany},
Pages = {223--227},
Title = {Statistical analysis of filled pauses' rhythm for disfluent speech synthesis},
Url = {http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html},
Year = {2007},
Abstract = {Given that state of the art speech synthesis systems have already reached a high naturalness level, it is time to move to talking speech from the actual read speech framework. For this purpose it is thus necessary to investigate how disfluencies can be included in speech synthesis and even increase its naturalness. This paper builds on a previously presented work and focuses on finding a local model of filled pauses rhythm. A statistical study of rhythm effects around filled pauses is presented and based on the correlation between rhythm variables, a regression model is proposed to predict filled pauses duration and prepausal lengthening},
Bdsk-File-1 = {YnBsaXN0MDDUAQIDBAUGJCVYJHZlcnNpb25YJG9iamVjdHNZJGFyY2hpdmVyVCR0b3ASAAGGoKgHCBMUFRYaIVUkbnVsbNMJCgsMDxJXTlMua2V5c1pOUy5vYmplY3RzViRjbGFzc6INDoACgAOiEBGABIAFgAdccmVsYXRpdmVQYXRoWWFsaWFzRGF0YV8QVC4uLy4uLy4uL0JpYmxpb2dyYWZpYS9QYXBlcnMvQWRlbGwvU3RhdGlzdGljYWwgYW5hbHlzaXMgb2YgZmlsbGVkIHBhdXNlcycgcmh5dGhtLnBkZtIXCxgZV05TLmRhdGFPEQI2AAAAAAI2AAIAAAxNYWNpbnRvc2ggSEQAAAAAAAAAAAAAAAAAAADL9h/OSCsAABCGZaofU3RhdGlzdGljYWwgYW5hbHlzIzEwODY2NUFGLnBkZgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAEIZlr9QJ0uUAAAAAAAAAAAADAAQAAAkgAAAAAAAAAAAAAAAAAAAABUFkZWxsAAAQAAgAAMv2A64AAAARAAgAANQJtsUAAAABABQQhmWqEIZljgAF/EcABfuYAADARgACAGNNYWNpbnRvc2ggSEQ6VXNlcnM6AGpvYXF1aW1fbGxpc3RlcnJpOgBCaWJsaW9ncmFmaWE6AFBhcGVyczoAQWRlbGw6AFN0YXRpc3RpY2FsIGFuYWx5cyMxMDg2NjVBRi5wZGYAAA4AZAAxAFMAdABhAHQAaQBzAHQAaQBjAGEAbAAgAGEAbgBhAGwAeQBzAGkAcwAgAG8AZgAgAGYAaQBsAGwAZQBkACAAcABhAHUAcwBlAHMAJwAgAHIAaAB5AHQAaABtAC4AcABkAGYADwAaAAwATQBhAGMAaQBuAHQAbwBzAGgAIABIAEQAEgBjVXNlcnMvam9hcXVpbV9sbGlzdGVycmkvQmlibGlvZ3JhZmlhL1BhcGVycy9BZGVsbC9TdGF0aXN0aWNhbCBhbmFseXNpcyBvZiBmaWxsZWQgcGF1c2VzJyByaHl0aG0ucGRmAAATAAEvAAAVAAIAGP//AACABtIbHB0eWiRjbGFzc25hbWVYJGNsYXNzZXNdTlNNdXRhYmxlRGF0YaMdHyBWTlNEYXRhWE5TT2JqZWN00hscIiNcTlNEaWN0aW9uYXJ5oiIgXxAPTlNLZXllZEFyY2hpdmVy0SYnVHJvb3SAAQAIABEAGgAjAC0AMgA3AEAARgBNAFUAYABnAGoAbABuAHEAcwB1AHcAhACOAOUA6gDyAywDLgMzAz4DRwNVA1kDYANpA24DewN+A5ADkwOYAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAA5o=},
Bdsk-Url-1 = {http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html}}
Downloads: 0
{"_id":"Kb7oTZFfmBaKgZZTu","bibbaseid":"adell-bonafonte-escudero-statisticalanalysisoffilledpausesrhythmfordisfluentspeechsynthesis-2007","downloads":0,"creationDate":"2016-09-21T09:08:37.869Z","title":"Statistical analysis of filled pauses' rhythm for disfluent speech synthesis","author_short":["Adell, J.","Bonafonte, A.","Escudero, D."],"year":2007,"bibtype":"inproceedings","biburl":"https://joaquimllisterri.cat/phonetics/ESTIVOZ/ESTIVOZ.bib","bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"propositions":[],"lastnames":["Adell"],"firstnames":["Jordi"],"suffixes":[]},{"propositions":[],"lastnames":["Bonafonte"],"firstnames":["Antonio"],"suffixes":[]},{"propositions":[],"lastnames":["Escudero"],"firstnames":["David"],"suffixes":[]}],"booktitle":"SSW6-2007. Proceedings of the Sixth ISCA Tutorial and Research Workshop in Speech Synthesis","date":"2007","date-modified":"2018-05-13 21:46:40 +0000","eventdate":"2007-08-22/2007-08-24","keywords":"disfluencies, duration, filled pauses, pause duration, pause location, pauses, phonetics, prosody, read speech, rhythm, segmental lengthening, Spanish, speaking styles, speech synthesis, speech technology, temporal factors, text-to-speech","location":"Bonn, Germany","pages":"223–227","title":"Statistical analysis of filled pauses' rhythm for disfluent speech synthesis","url":"http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html","year":"2007","abstract":"Given that state of the art speech synthesis systems have already reached a high naturalness level, it is time to move to talking speech from the actual read speech framework. For this purpose it is thus necessary to investigate how disfluencies can be included in speech synthesis and even increase its naturalness. This paper builds on a previously presented work and focuses on finding a local model of filled pauses rhythm. 
A statistical study of rhythm effects around filled pauses is presented and based on the correlation between rhythm variables, a regression model is proposed to predict filled pauses duration and prepausal lengthening","bdsk-file-1":"YnBsaXN0MDDUAQIDBAUGJCVYJHZlcnNpb25YJG9iamVjdHNZJGFyY2hpdmVyVCR0b3ASAAGGoKgHCBMUFRYaIVUkbnVsbNMJCgsMDxJXTlMua2V5c1pOUy5vYmplY3RzViRjbGFzc6INDoACgAOiEBGABIAFgAdccmVsYXRpdmVQYXRoWWFsaWFzRGF0YV8QVC4uLy4uLy4uL0JpYmxpb2dyYWZpYS9QYXBlcnMvQWRlbGwvU3RhdGlzdGljYWwgYW5hbHlzaXMgb2YgZmlsbGVkIHBhdXNlcycgcmh5dGhtLnBkZtIXCxgZV05TLmRhdGFPEQI2AAAAAAI2AAIAAAxNYWNpbnRvc2ggSEQAAAAAAAAAAAAAAAAAAADL9h/OSCsAABCGZaofU3RhdGlzdGljYWwgYW5hbHlzIzEwODY2NUFGLnBkZgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAEIZlr9QJ0uUAAAAAAAAAAAADAAQAAAkgAAAAAAAAAAAAAAAAAAAABUFkZWxsAAAQAAgAAMv2A64AAAARAAgAANQJtsUAAAABABQQhmWqEIZljgAF/EcABfuYAADARgACAGNNYWNpbnRvc2ggSEQ6VXNlcnM6AGpvYXF1aW1fbGxpc3RlcnJpOgBCaWJsaW9ncmFmaWE6AFBhcGVyczoAQWRlbGw6AFN0YXRpc3RpY2FsIGFuYWx5cyMxMDg2NjVBRi5wZGYAAA4AZAAxAFMAdABhAHQAaQBzAHQAaQBjAGEAbAAgAGEAbgBhAGwAeQBzAGkAcwAgAG8AZgAgAGYAaQBsAGwAZQBkACAAcABhAHUAcwBlAHMAJwAgAHIAaAB5AHQAaABtAC4AcABkAGYADwAaAAwATQBhAGMAaQBuAHQAbwBzAGgAIABIAEQAEgBjVXNlcnMvam9hcXVpbV9sbGlzdGVycmkvQmlibGlvZ3JhZmlhL1BhcGVycy9BZGVsbC9TdGF0aXN0aWNhbCBhbmFseXNpcyBvZiBmaWxsZWQgcGF1c2VzJyByaHl0aG0ucGRmAAATAAEvAAAVAAIAGP//AACABtIbHB0eWiRjbGFzc25hbWVYJGNsYXNzZXNdTlNNdXRhYmxlRGF0YaMdHyBWTlNEYXRhWE5TT2JqZWN00hscIiNcTlNEaWN0aW9uYXJ5oiIgXxAPTlNLZXllZEFyY2hpdmVy0SYnVHJvb3SAAQAIABEAGgAjAC0AMgA3AEAARgBNAFUAYABnAGoAbABuAHEAcwB1AHcAhACOAOUA6gDyAywDLgMzAz4DRwNVA1kDYANpA24DewN+A5ADkwOYAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAA5o=","bdsk-url-1":"http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html","bibtex":"@inproceedings{adell_statistical_2007,\n\tAuthor = {Adell, Jordi and Bonafonte, Antonio and Escudero, David},\n\tBooktitle = {SSW6-2007. 
Proceedings of the Sixth ISCA Tutorial and Research Workshop in Speech Synthesis},\n\tDate = {2007},\n\tDate-Modified = {2018-05-13 21:46:40 +0000},\n\tEventdate = {2007-08-22/2007-08-24},\n\tKeywords = {disfluencies, duration, filled pauses, pause duration, pause location, pauses, phonetics, prosody, read speech, rhythm, segmental lengthening, Spanish, speaking styles, speech synthesis, speech technology, temporal factors, text-to-speech},\n\tLocation = {Bonn, Germany},\n\tPages = {223--227},\n\tTitle = {Statistical analysis of filled pauses' rhythm for disfluent speech synthesis},\n\tUrl = {http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html},\n\tYear = {2007},\n\tAbstract = {Given that state of the art speech synthesis systems have already reached a high naturalness level, it is time to move to talking speech from the actual read speech framework. For this purpose it is thus necessary to investigate how disfluencies can be included in speech synthesis and even increase its naturalness. This paper builds on a previously presented work and focuses on finding a local model of filled pauses rhythm. 
A statistical study of rhythm effects around filled pauses is presented and based on the correlation between rhythm variables, a regression model is proposed to predict filled pauses duration and prepausal lengthening},\n\tBdsk-File-1 = {YnBsaXN0MDDUAQIDBAUGJCVYJHZlcnNpb25YJG9iamVjdHNZJGFyY2hpdmVyVCR0b3ASAAGGoKgHCBMUFRYaIVUkbnVsbNMJCgsMDxJXTlMua2V5c1pOUy5vYmplY3RzViRjbGFzc6INDoACgAOiEBGABIAFgAdccmVsYXRpdmVQYXRoWWFsaWFzRGF0YV8QVC4uLy4uLy4uL0JpYmxpb2dyYWZpYS9QYXBlcnMvQWRlbGwvU3RhdGlzdGljYWwgYW5hbHlzaXMgb2YgZmlsbGVkIHBhdXNlcycgcmh5dGhtLnBkZtIXCxgZV05TLmRhdGFPEQI2AAAAAAI2AAIAAAxNYWNpbnRvc2ggSEQAAAAAAAAAAAAAAAAAAADL9h/OSCsAABCGZaofU3RhdGlzdGljYWwgYW5hbHlzIzEwODY2NUFGLnBkZgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAEIZlr9QJ0uUAAAAAAAAAAAADAAQAAAkgAAAAAAAAAAAAAAAAAAAABUFkZWxsAAAQAAgAAMv2A64AAAARAAgAANQJtsUAAAABABQQhmWqEIZljgAF/EcABfuYAADARgACAGNNYWNpbnRvc2ggSEQ6VXNlcnM6AGpvYXF1aW1fbGxpc3RlcnJpOgBCaWJsaW9ncmFmaWE6AFBhcGVyczoAQWRlbGw6AFN0YXRpc3RpY2FsIGFuYWx5cyMxMDg2NjVBRi5wZGYAAA4AZAAxAFMAdABhAHQAaQBzAHQAaQBjAGEAbAAgAGEAbgBhAGwAeQBzAGkAcwAgAG8AZgAgAGYAaQBsAGwAZQBkACAAcABhAHUAcwBlAHMAJwAgAHIAaAB5AHQAaABtAC4AcABkAGYADwAaAAwATQBhAGMAaQBuAHQAbwBzAGgAIABIAEQAEgBjVXNlcnMvam9hcXVpbV9sbGlzdGVycmkvQmlibGlvZ3JhZmlhL1BhcGVycy9BZGVsbC9TdGF0aXN0aWNhbCBhbmFseXNpcyBvZiBmaWxsZWQgcGF1c2VzJyByaHl0aG0ucGRmAAATAAEvAAAVAAIAGP//AACABtIbHB0eWiRjbGFzc25hbWVYJGNsYXNzZXNdTlNNdXRhYmxlRGF0YaMdHyBWTlNEYXRhWE5TT2JqZWN00hscIiNcTlNEaWN0aW9uYXJ5oiIgXxAPTlNLZXllZEFyY2hpdmVy0SYnVHJvb3SAAQAIABEAGgAjAC0AMgA3AEAARgBNAFUAYABnAGoAbABuAHEAcwB1AHcAhACOAOUA6gDyAywDLgMzAz4DRwNVA1kDYANpA24DewN+A5ADkwOYAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAA5o=},\n\tBdsk-Url-1 = {http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html}}\n\n","author_short":["Adell, J.","Bonafonte, A.","Escudero, 
D."],"key":"adell_statistical_2007","id":"adell_statistical_2007","bibbaseid":"adell-bonafonte-escudero-statisticalanalysisoffilledpausesrhythmfordisfluentspeechsynthesis-2007","role":"author","urls":{"Paper":"http://www.isca-speech.org/archive_open/ssw6/ssw6_223.html"},"keyword":["disfluencies","duration","filled pauses","pause duration","pause location","pauses","phonetics","prosody","read speech","rhythm","segmental lengthening","Spanish","speaking styles","speech synthesis","speech technology","temporal factors","text-to-speech"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"search_terms":["statistical","analysis","filled","pauses","rhythm","disfluent","speech","synthesis","adell","bonafonte","escudero"],"keywords":["disfluencies","duration","filled pauses","pause duration","pause location","pauses","phonetics","prosody","read speech","rhythm","segmental lengthening","spanish","speaking styles","speech synthesis","speech technology","temporal factors","text-to-speech"],"authorIDs":[],"dataSources":["qBn3jEfYwFvzHJsYh","BrMmNtBqG9aDvpsZn"]}