A Danish phonetically annotated spontaneous speech corpus (DanPASS). Grønnum, N. Speech Communication, 51(7):594–603, July, 2009.
Links: Paper, doi, abstract, bibtex
Abstract: A corpus is described consisting of non-scripted monologues and dialogues, recorded by 27 speakers, comprising a total of 73,227 running words, corresponding to 9h and 46min of speech. The monologues were recorded as one-way communication with an unseen partner where the speaker performed three different tasks: (s)he described a network consisting of various geometrical shapes in various colours, (s)he guided the listener through four different routes in a virtual city map, and (s)he instructed the listener how to build a house from its individual pieces. The dialogues are replicas of the HCRC map tasks. Annotation is performed in Praat. The sound files are segmented into prosodic phrases, words, and syllables. The files are supplied, in separate interval tiers, with an orthographical representation, detailed part-of-speech tags, simplified part-of-speech tags, a phonemic notation, a semi-narrow phonetic notation, a symbolic representation of the pitch relation between each stressed and post-tonic syllable, and a symbolic representation of the phrasal intonation.
@article{gronnum_danish_2009,
series = {Research {Challenges} in {Speech} {Technology}: {A} {Special} {Issue} in {Honour} of {Rolf} {Carlson} and {Björn} {Granström}},
title = {A {Danish} phonetically annotated spontaneous speech corpus ({DanPASS})},
volume = {51},
issn = {0167-6393},
url = {http://www.sciencedirect.com/science/article/pii/S016763930800174X},
doi = {10.1016/j.specom.2008.11.002},
abstract = {A corpus is described consisting of non-scripted monologues and dialogues, recorded by 27 speakers, comprising a total of 73,227 running words, corresponding to 9h and 46min of speech. The monologues were recorded as one-way communication with an unseen partner where the speaker performed three different tasks: (s)he described a network consisting of various geometrical shapes in various colours, (s)he guided the listener through four different routes in a virtual city map, and (s)he instructed the listener how to build a house from its individual pieces. The dialogues are replicas of the HCRC map tasks. Annotation is performed in Praat. The sound files are segmented into prosodic phrases, words, and syllables. The files are supplied, in separate interval tiers, with an orthographical representation, detailed part-of-speech tags, simplified part-of-speech tags, a phonemic notation, a semi-narrow phonetic notation, a symbolic representation of the pitch relation between each stressed and post-tonic syllable, and a symbolic representation of the phrasal intonation.},
number = {7},
urldate = {2018-10-20},
journal = {Speech Communication},
author = {Grønnum, Nina},
month = jul,
year = {2009},
keywords = {Corpus, Dialogue, Monologue, Phonetic notation, Prosodic labeling, Spontaneous speech},
pages = {594--603},
}
Downloads: 0
{"_id":"GvRp399utoJkXddiT","bibbaseid":"grnnum-adanishphoneticallyannotatedspontaneousspeechcorpusdanpass-2009","author_short":["Grønnum, N."],"bibdata":{"bibtype":"article","type":"article","series":"Research Challenges in Speech Technology: A Special Issue in Honour of Rolf Carlson and Björn Granström","title":"A Danish phonetically annotated spontaneous speech corpus (DanPASS)","volume":"51","issn":"0167-6393","url":"http://www.sciencedirect.com/science/article/pii/S016763930800174X","doi":"10.1016/j.specom.2008.11.002","abstract":"A corpus is described consisting of non-scripted monologues and dialogues, recorded by 27 speakers, comprising a total of 73,227 running words, corresponding to 9h and 46min of speech. The monologues were recorded as one-way communication with an unseen partner where the speaker performed three different tasks: (s)he described a network consisting of various geometrical shapes in various colours, (s)he guided the listener through four different routes in a virtual city map, and (s)he instructed the listener how to build a house from its individual pieces. The dialogues are replicas of the HCRC map tasks. Annotation is performed in Praat. The sound files are segmented into prosodic phrases, words, and syllables. \nThe files are supplied, in separate interval tiers, with an orthographical representation, detailed part-of-speech tags, simplified part-of-speech tags, a phonemic notation, a semi-narrow phonetic notation, a symbolic representation of the pitch relation between each stressed and post-tonic syllable, and a symbolic representation of the phrasal intonation.","number":"7","urldate":"2018-10-20","journal":"Speech Communication","author":[{"propositions":[],"lastnames":["Grønnum"],"firstnames":["Nina"],"suffixes":[]}],"month":"July","year":"2009","keywords":"Corpus, Dialogue, Monologue, Phonetic notation, Prosodic labeling, Spontaneous speech","pages":"594–603","bibtex":"@article{gronnum_danish_2009,\n\tseries = {Research {Challenges} in {Speech} {Technology}: {A} {Special} {Issue} in {Honour} of {Rolf} {Carlson} and {Björn} {Granström}},\n\ttitle = {A {Danish} phonetically annotated spontaneous speech corpus ({DanPASS})},\n\tvolume = {51},\n\tissn = {0167-6393},\n\turl = {http://www.sciencedirect.com/science/article/pii/S016763930800174X},\n\tdoi = {10.1016/j.specom.2008.11.002},\n\tabstract = {A corpus is described consisting of non-scripted monologues and dialogues, recorded by 27 speakers, comprising a total of 73,227 running words, corresponding to 9h and 46min of speech. The monologues were recorded as one-way communication with an unseen partner where the speaker performed three different tasks: (s)he described a network consisting of various geometrical shapes in various colours, (s)he guided the listener through four different routes in a virtual city map, and (s)he instructed the listener how to build a house from its individual pieces. The dialogues are replicas of the HCRC map tasks. Annotation is performed in Praat. The sound files are segmented into prosodic phrases, words, and syllables. \nThe files are supplied, in separate interval tiers, with an orthographical representation, detailed part-of-speech tags, simplified part-of-speech tags, a phonemic notation, a semi-narrow phonetic notation, a symbolic representation of the pitch relation between each stressed and post-tonic syllable, and a symbolic representation of the phrasal intonation.},\n\tnumber = {7},\n\turldate = {2018-10-20},\n\tjournal = {Speech Communication},\n\tauthor = {Grønnum, Nina},\n\tmonth = jul,\n\tyear = {2009},\n\tkeywords = {Corpus, Dialogue, Monologue, Phonetic notation, Prosodic labeling, Spontaneous speech},\n\tpages = {594--603},\n}\n\n","author_short":["Grønnum, N."],"key":"gronnum_danish_2009","id":"gronnum_danish_2009","bibbaseid":"grnnum-adanishphoneticallyannotatedspontaneousspeechcorpusdanpass-2009","role":"author","urls":{"Paper":"http://www.sciencedirect.com/science/article/pii/S016763930800174X"},"keyword":["Corpus","Dialogue","Monologue","Phonetic notation","Prosodic labeling","Spontaneous speech"],"metadata":{"authorlinks":{}},"html":""},"bibtype":"article","biburl":"https://sorensandagersorensen.dk/res/danishgrammar.bib","dataSources":["36DYTpvwhpPPf8eDJ"],"keywords":["corpus","dialogue","monologue","phonetic notation","prosodic labeling","spontaneous speech"],"search_terms":["danish","phonetically","annotated","spontaneous","speech","corpus","danpass","grønnum"],"title":"A Danish phonetically annotated spontaneous speech corpus (DanPASS)","year":2009}