Representativeness in Corpus Design. Biber, D. Literary and Linguistic Computing, 8(4):243–257, October, 1993.
Paper doi abstract bibtex The present paper addresses a number of issues related to achieving ‘representativeness’ in linguistic corpus design, including: discussion of what it means to ‘represent’ a language, definition of the target population, stratified versus proportional sampling of a language, sampling within texts, and issues relating to the required sample size (number of texts) of a corpus. The paper distinguishes among various ways that linguistic features can be distributed within and across texts; it analyzes the distributions of several particular features, and it discusses the implications of these distributions for corpus design.
@article{biber_representativeness_1993,
  author   = {Biber, Douglas},
  title    = {Representativeness in Corpus Design},
  journal  = {Literary and Linguistic Computing},
  volume   = {8},
  number   = {4},
  pages    = {243--257},
  year     = {1993},
  month    = oct,
  issn     = {0268-1145, 1477-4615},
  doi      = {10.1093/llc/8.4.243},
  url      = {https://academic.oup.com/dsh/article-lookup/doi/10.1093/llc/8.4.243},
  urldate  = {2024-09-04},
  language = {en},
  abstract = {The present paper addresses a number of issues related to achieving ‘representativeness’ in linguistic corpus design, including: discussion of what it means to ‘represent’ a language, definition of the target population, stratified versus proportional sampling of a language, sampling within texts, and issues relating to the required sample size (number of texts) of a corpus. The paper distinguishes among various ways that linguistic features can be distributed within and across texts; it analyzes the distributions of several particular features, and it discusses the implications of these distributions for corpus design.},
}
Downloads: 0
{"_id":"B4cMmfZWP2i94cCAH","bibbaseid":"biber-representativenessincorpusdesign-1993","author_short":["Biber, D."],"bibdata":{"bibtype":"article","type":"article","title":"Representativeness in Corpus Design","volume":"8","issn":"0268-1145, 1477-4615","url":"https://academic.oup.com/dsh/article-lookup/doi/10.1093/llc/8.4.243","doi":"10.1093/llc/8.4.243","abstract":"The present paper addresses a number of issues related to achieving ‘representativeness’ in linguistic corpus design, including: discussion of what it means to `represent’ a language, definition of the target population, stratified versus proportional sampling of a language, sampling within texts, and issues relating to the required sample size (number of texts) of a corpus. The paper distinguishes among various ways that linguistic features can be distributed within and across texts; it analyzes the distributions of several particular features, and it discusses the implications of these distributions for corpus design.","language":"en","number":"4","urldate":"2024-09-04","journal":"Literary and Linguistic Computing","author":[{"propositions":[],"lastnames":["Biber"],"firstnames":["D."],"suffixes":[]}],"month":"October","year":"1993","pages":"243–257","bibtex":"@article{biber_representativeness_1993,\n\ttitle = {Representativeness in {Corpus} {Design}},\n\tvolume = {8},\n\tissn = {0268-1145, 1477-4615},\n\turl = {https://academic.oup.com/dsh/article-lookup/doi/10.1093/llc/8.4.243},\n\tdoi = {10.1093/llc/8.4.243},\n\tabstract = {The present paper addresses a number of issues related to achieving ‘representativeness’ in linguistic corpus design, including: discussion of what it means to `represent’ a language, definition of the target population, stratified versus proportional sampling of a language, sampling within texts, and issues relating to the required sample size (number of texts) of a corpus. 
The paper distinguishes among various ways that linguistic features can be distributed within and across texts; it analyzes the distributions of several particular features, and it discusses the implications of these distributions for corpus design.},\n\tlanguage = {en},\n\tnumber = {4},\n\turldate = {2024-09-04},\n\tjournal = {Literary and Linguistic Computing},\n\tauthor = {Biber, D.},\n\tmonth = oct,\n\tyear = {1993},\n\tpages = {243--257},\n}\n\n\n\n\n\n\n\n\n\n\n\n","author_short":["Biber, D."],"key":"biber_representativeness_1993","id":"biber_representativeness_1993","bibbaseid":"biber-representativenessincorpusdesign-1993","role":"author","urls":{"Paper":"https://academic.oup.com/dsh/article-lookup/doi/10.1093/llc/8.4.243"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://bibbase.org/zotero/abhishek-p","dataSources":["h7kKWXpJh2iaX92T5"],"keywords":[],"search_terms":["representativeness","corpus","design","biber"],"title":"Representativeness in Corpus Design","year":1993}