Potential of Low-Coverage Genotyping-by-Sequencing and Imputation for Cost-Effective Genomic Selection in Biparental Segregating Populations. Gorjanc, G., Dumasy, J., Gonen, S., Gaynor, R., C., Antolin, R., & Hickey, J., M. Crop Science, 57:1404-1420, The Crop Science Society of America, Inc., 2017.
Potential of Low-Coverage Genotyping-by-Sequencing and Imputation for Cost-Effective Genomic Selection in Biparental Segregating Populations [link]Website  abstract   bibtex   
Genotyping-by-sequencing (GBS) is an alternative genotyping method to single-nucleotide polymorphism (SNP) arrays that has received considerable attention in the plant breeding community. In this study we use simulation to quantify the potential of low-coverage GBS and imputation for cost-effective genomic selection in biparental segregating populations. The simulations comprised a range of scenarios where SNP array or GBS data were used to train the genomic selection model, to predict breeding values, or both. The GBS data were generated with sequencing coverages (x) from 4x to 0.01x. The data were used either nonimputed or imputed by the AlphaImpute program. The size of the training and prediction sets was either held fixed or was increased by reducing sequencing coverage per individual. The results show that nonimputed 1x GBS data provided comparable prediction accuracy and bias, and for the used measurement of return on investment, outperformed the SNP array data. Imputation allowed for further reduction in sequencing coverage, to as low as 0.1x with 10,000 markers or 0.01x with 100,000 markers. The results suggest that using such data in biparental families gave up to 5.63 times higher return on investment than using the SNP array data. Reduction of sequencing coverage per individual and imputation can be leveraged to genotype larger training sets to increase prediction accuracy and larger prediction sets to increase selection intensity, which both allow for higher response to selection and higher return on investment.
@article{
 title = {Potential of Low-Coverage Genotyping-by-Sequencing and Imputation for Cost-Effective Genomic Selection in Biparental Segregating Populations},
 type = {article},
 year = {2017},
 identifiers = {[object Object]},
 pages = {1404-1420},
 volume = {57},
 websites = {http://dx.doi.org/10.2135/cropsci2016.08.0675},
 publisher = {The Crop Science Society of America, Inc.},
 city = {Madison, WI},
 id = {935d4c6c-f61b-398d-9846-dbca18189f57},
 created = {2018-05-03T12:05:19.835Z},
 file_attached = {false},
 profile_id = {9ca27882-2561-35ad-83fc-979e45a13e32},
 group_id = {6e40dffa-27af-331f-992a-70c68bd0c7e9},
 last_modified = {2018-05-03T12:05:19.835Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 source_type = {JOUR},
 language = {English},
 private_publication = {false},
 abstract = {Genotyping-by-sequencing (GBS) is an alternative genotyping method to single-nucleotide polymorphism (SNP) arrays that has received considerable attention in the plant breeding community. In this study we use simulation to quantify the potential of low-coverage GBS and imputation for cost-effective genomic selection in biparental segregating populations. The simulations comprised a range of scenarios where SNP array or GBS data were used to train the genomic selection model, to predict breeding values, or both. The GBS data were generated with sequencing coverages (x) from 4x to 0.01x. The data were used either nonimputed or imputed by the AlphaImpute program. The size of the training and prediction sets was either held fixed or was increased by reducing sequencing coverage per individual. The results show that nonimputed 1x GBS data provided comparable prediction accuracy and bias, and for the used measurement of return on investment, outperformed the SNP array data. Imputation allowed for further reduction in sequencing coverage, to as low as 0.1x with 10,000 markers or 0.01x with 100,000 markers. The results suggest that using such data in biparental families gave up to 5.63 times higher return on investment than using the SNP array data. Reduction of sequencing coverage per individual and imputation can be leveraged to genotype larger training sets to increase prediction accuracy and larger prediction sets to increase selection intensity, which both allow for higher response to selection and higher return on investment.},
 bibtype = {article},
 author = {Gorjanc, Gregor and Dumasy, Jean-Francois and Gonen, Serap and Gaynor, R Chris and Antolin, Roberto and Hickey, John M},
 journal = {Crop Science}
}

Downloads: 0