A Computable Phenotype Improves Cohort Ascertainment in a Pediatric Pulmonary Hypertension Registry. Geva, A., Gronsbell, J. L., Cai, T., Cai, T., Murphy, S. N., Lyons, J. C., Heinz, M. M., Natter, M. D., Patibandla, N., Bickel, J., Mullen, M. P., Mandl, K. D., Pediatric Pulmonary Hypertension Network, National Heart, L., & Investigators, B. I. P. P. V. D. O. B. C. C. C. The Journal of Pediatrics, 188:224–231.e5, September, 2017. doi abstract bibtex OBJECTIVES: To compare registry and electronic health record (EHR) data mining approaches for cohort ascertainment in patients with pediatric pulmonary hypertension (PH) in an effort to overcome some of the limitations of registry enrollment alone in identifying patients with particular disease phenotypes. STUDY DESIGN: This study was a single-center retrospective analysis of EHR and registry data at Boston Children's Hospital. The local Informatics for Integrating Biology and the Bedside (i2b2) data warehouse was queried for billing codes, prescriptions, and narrative data related to pediatric PH. Computable phenotype algorithms were developed by fitting penalized logistic regression models to a physician-annotated training set. Algorithms were applied to a candidate patient cohort, and performance was evaluated using a separate set of 136 records and 179 registry patients. We compared clinical and demographic characteristics of patients identified by computable phenotype and the registry. RESULTS: The computable phenotype had an area under the receiver operating characteristics curve of 90% (95% CI, 85%-95%), a positive predictive value of 85% (95% CI, 77%-93%), and identified 413 patients (an additional 231%) with pediatric PH who were not enrolled in the registry. Patients identified by the computable phenotype were clinically distinct from registry patients, with a greater prevalence of diagnoses related to perinatal distress and left heart disease. CONCLUSIONS: Mining of EHRs using computable phenotypes identified a large cohort of patients not recruited using a classic registry. Fusion of EHR and registry data can improve cohort ascertainment for the study of rare diseases. TRIAL REGISTRATION: ClinicalTrials.gov: NCT02249923.
@article{geva_computable_2017,
title = {A {Computable} {Phenotype} {Improves} {Cohort} {Ascertainment} in a {Pediatric} {Pulmonary} {Hypertension} {Registry}},
volume = {188},
issn = {1097-6833},
doi = {10.1016/j.jpeds.2017.05.037},
abstract = {OBJECTIVES: To compare registry and electronic health record (EHR) data mining approaches for cohort ascertainment in patients with pediatric pulmonary hypertension (PH) in an effort to overcome some of the limitations of registry enrollment alone in identifying patients with particular disease phenotypes.
STUDY DESIGN: This study was a single-center retrospective analysis of EHR and registry data at Boston Children's Hospital. The local Informatics for Integrating Biology and the Bedside (i2b2) data warehouse was queried for billing codes, prescriptions, and narrative data related to pediatric PH. Computable phenotype algorithms were developed by fitting penalized logistic regression models to a physician-annotated training set. Algorithms were applied to a candidate patient cohort, and performance was evaluated using a separate set of 136 records and 179 registry patients. We compared clinical and demographic characteristics of patients identified by computable phenotype and the registry.
RESULTS: The computable phenotype had an area under the receiver operating characteristics curve of 90\% (95\% CI, 85\%-95\%), a positive predictive value of 85\% (95\% CI, 77\%-93\%), and identified 413 patients (an additional 231\%) with pediatric PH who were not enrolled in the registry. Patients identified by the computable phenotype were clinically distinct from registry patients, with a greater prevalence of diagnoses related to perinatal distress and left heart disease.
CONCLUSIONS: Mining of EHRs using computable phenotypes identified a large cohort of patients not recruited using a classic registry. Fusion of EHR and registry data can improve cohort ascertainment for the study of rare diseases.
TRIAL REGISTRATION: ClinicalTrials.gov: NCT02249923.},
language = {eng},
journal = {The Journal of Pediatrics},
author = {Geva, Alon and Gronsbell, Jessica L. and Cai, Tianxi and Cai, Tianrun and Murphy, Shawn N. and Lyons, Jessica C. and Heinz, Michelle M. and Natter, Marc D. and Patibandla, Nandan and Bickel, Jonathan and Mullen, Mary P. and Mandl, Kenneth D. and {Pediatric Pulmonary Hypertension Network and National Heart, Lung, and Blood Institute Pediatric Pulmonary Vascular Disease Outcomes Bioinformatics Clinical Coordinating Center Investigators}},
month = sep,
year = {2017},
pmid = {28625502},
pmcid = {PMC5572538},
keywords = {Algorithms, Child, Data Mining, Electronic Health Records, Humans, Hypertension, Pulmonary, Phenotype, Predictive Value of Tests, Registries, Retrospective Studies, Sensitivity and Specificity, United States, bioinformatics, computer-based model, pediatrics, pulmonary hypertension, registry},
pages = {224--231.e5},
}
Downloads: 0
{"_id":"ZhuQBk4ajsryRDjph","bibbaseid":"geva-gronsbell-cai-cai-murphy-lyons-heinz-natter-etal-acomputablephenotypeimprovescohortascertainmentinapediatricpulmonaryhypertensionregistry-2017","author_short":["Geva, A.","Gronsbell, J. L.","Cai, T.","Cai, T.","Murphy, S. N.","Lyons, J. C.","Heinz, M. M.","Natter, M. D.","Patibandla, N.","Bickel, J.","Mullen, M. P.","Mandl, K. D.","Pediatric Pulmonary Hypertension Network","National Heart, L.","Investigators, B. I. P. P. V. D. O. B. C. C. C."],"bibdata":{"bibtype":"article","type":"article","title":"A Computable Phenotype Improves Cohort Ascertainment in a Pediatric Pulmonary Hypertension Registry","volume":"188","issn":"1097-6833","doi":"10.1016/j.jpeds.2017.05.037","abstract":"OBJECTIVES: To compare registry and electronic health record (EHR) data mining approaches for cohort ascertainment in patients with pediatric pulmonary hypertension (PH) in an effort to overcome some of the limitations of registry enrollment alone in identifying patients with particular disease phenotypes. STUDY DESIGN: This study was a single-center retrospective analysis of EHR and registry data at Boston Children's Hospital. The local Informatics for Integrating Biology and the Bedside (i2b2) data warehouse was queried for billing codes, prescriptions, and narrative data related to pediatric PH. Computable phenotype algorithms were developed by fitting penalized logistic regression models to a physician-annotated training set. Algorithms were applied to a candidate patient cohort, and performance was evaluated using a separate set of 136 records and 179 registry patients. We compared clinical and demographic characteristics of patients identified by computable phenotype and the registry. RESULTS: The computable phenotype had an area under the receiver operating characteristics curve of 90% (95% CI, 85%-95%), a positive predictive value of 85% (95% CI, 77%-93%), and identified 413 patients (an additional 231%) with pediatric PH who were not enrolled in the registry. Patients identified by the computable phenotype were clinically distinct from registry patients, with a greater prevalence of diagnoses related to perinatal distress and left heart disease. CONCLUSIONS: Mining of EHRs using computable phenotypes identified a large cohort of patients not recruited using a classic registry. Fusion of EHR and registry data can improve cohort ascertainment for the study of rare diseases. TRIAL REGISTRATION: ClinicalTrials.gov: NCT02249923.","language":"eng","journal":"The Journal of Pediatrics","author":[{"propositions":[],"lastnames":["Geva"],"firstnames":["Alon"],"suffixes":[]},{"propositions":[],"lastnames":["Gronsbell"],"firstnames":["Jessica","L."],"suffixes":[]},{"propositions":[],"lastnames":["Cai"],"firstnames":["Tianxi"],"suffixes":[]},{"propositions":[],"lastnames":["Cai"],"firstnames":["Tianrun"],"suffixes":[]},{"propositions":[],"lastnames":["Murphy"],"firstnames":["Shawn","N."],"suffixes":[]},{"propositions":[],"lastnames":["Lyons"],"firstnames":["Jessica","C."],"suffixes":[]},{"propositions":[],"lastnames":["Heinz"],"firstnames":["Michelle","M."],"suffixes":[]},{"propositions":[],"lastnames":["Natter"],"firstnames":["Marc","D."],"suffixes":[]},{"propositions":[],"lastnames":["Patibandla"],"firstnames":["Nandan"],"suffixes":[]},{"propositions":[],"lastnames":["Bickel"],"firstnames":["Jonathan"],"suffixes":[]},{"propositions":[],"lastnames":["Mullen"],"firstnames":["Mary","P."],"suffixes":[]},{"propositions":[],"lastnames":["Mandl"],"firstnames":["Kenneth","D."],"suffixes":[]},{"firstnames":[],"propositions":[],"lastnames":["Pediatric Pulmonary Hypertension Network"],"suffixes":[]},{"propositions":[],"lastnames":["National","Heart"],"firstnames":["Lung"],"suffixes":[""]},{"firstnames":["Blood","Institute","Pediatric","Pulmonary","Vascular","Disease","Outcomes","Bioinformatics","Clinical","Coordinating","Center"],"propositions":[],"lastnames":["Investigators"],"suffixes":[]}],"month":"September","year":"2017","pmid":"28625502","pmcid":"PMC5572538","keywords":"Algorithms, Child, Data Mining, Electronic Health Records, Humans, Hypertension, Pulmonary, Phenotype, Predictive Value of Tests, Registries, Retrospective Studies, Sensitivity and Specificity, United States, bioinformatics, computer-based model, pediatrics, pulmonary hypertension, registry","pages":"224–231.e5","bibtex":"@article{geva_computable_2017,\n\ttitle = {A {Computable} {Phenotype} {Improves} {Cohort} {Ascertainment} in a {Pediatric} {Pulmonary} {Hypertension} {Registry}},\n\tvolume = {188},\n\tissn = {1097-6833},\n\tdoi = {10.1016/j.jpeds.2017.05.037},\n\tabstract = {OBJECTIVES: To compare registry and electronic health record (EHR) data mining approaches for cohort ascertainment in patients with pediatric pulmonary hypertension (PH) in an effort to overcome some of the limitations of registry enrollment alone in identifying patients with particular disease phenotypes.\nSTUDY DESIGN: This study was a single-center retrospective analysis of EHR and registry data at Boston Children's Hospital. The local Informatics for Integrating Biology and the Bedside (i2b2) data warehouse was queried for billing codes, prescriptions, and narrative data related to pediatric PH. Computable phenotype algorithms were developed by fitting penalized logistic regression models to a physician-annotated training set. Algorithms were applied to a candidate patient cohort, and performance was evaluated using a separate set of 136 records and 179 registry patients. We compared clinical and demographic characteristics of patients identified by computable phenotype and the registry.\nRESULTS: The computable phenotype had an area under the receiver operating characteristics curve of 90\\% (95\\% CI, 85\\%-95\\%), a positive predictive value of 85\\% (95\\% CI, 77\\%-93\\%), and identified 413 patients (an additional 231\\%) with pediatric PH who were not enrolled in the registry. Patients identified by the computable phenotype were clinically distinct from registry patients, with a greater prevalence of diagnoses related to perinatal distress and left heart disease.\nCONCLUSIONS: Mining of EHRs using computable phenotypes identified a large cohort of patients not recruited using a classic registry. Fusion of EHR and registry data can improve cohort ascertainment for the study of rare diseases.\nTRIAL REGISTRATION: ClinicalTrials.gov: NCT02249923.},\n\tlanguage = {eng},\n\tjournal = {The Journal of Pediatrics},\n\tauthor = {Geva, Alon and Gronsbell, Jessica L. and Cai, Tianxi and Cai, Tianrun and Murphy, Shawn N. and Lyons, Jessica C. and Heinz, Michelle M. and Natter, Marc D. and Patibandla, Nandan and Bickel, Jonathan and Mullen, Mary P. and Mandl, Kenneth D. and {Pediatric Pulmonary Hypertension Network and National Heart, Lung, and Blood Institute Pediatric Pulmonary Vascular Disease Outcomes Bioinformatics Clinical Coordinating Center Investigators}},\n\tmonth = sep,\n\tyear = {2017},\n\tpmid = {28625502},\n\tpmcid = {PMC5572538},\n\tkeywords = {Algorithms, Child, Data Mining, Electronic Health Records, Humans, Hypertension, Pulmonary, Phenotype, Predictive Value of Tests, Registries, Retrospective Studies, Sensitivity and Specificity, United States, bioinformatics, computer-based model, pediatrics, pulmonary hypertension, registry},\n\tpages = {224--231.e5},\n}\n\n","author_short":["Geva, A.","Gronsbell, J. L.","Cai, T.","Cai, T.","Murphy, S. N.","Lyons, J. C.","Heinz, M. M.","Natter, M. D.","Patibandla, N.","Bickel, J.","Mullen, M. P.","Mandl, K. D.","Pediatric Pulmonary Hypertension Network","National Heart, L.","Investigators, B. I. P. P. V. D. O. B. C. C. C."],"key":"geva_computable_2017-1","id":"geva_computable_2017-1","bibbaseid":"geva-gronsbell-cai-cai-murphy-lyons-heinz-natter-etal-acomputablephenotypeimprovescohortascertainmentinapediatricpulmonaryhypertensionregistry-2017","role":"author","urls":{},"keyword":["Algorithms","Child","Data Mining","Electronic Health Records","Humans","Hypertension","Pulmonary","Phenotype","Predictive Value of Tests","Registries","Retrospective Studies","Sensitivity and Specificity","United States","bioinformatics","computer-based model","pediatrics","pulmonary hypertension","registry"],"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://bibbase.org/zotero/rudypoten","dataSources":["vjYJBNxextb6LkLck","CT2QdQoQtu2wab8TD","YdNQMN8q4Sir34fgi","JGNRjejujgZaT5Woe","Rg7mRMhmZYnCLLEgE","2jPTcmjEXPKsta6A2","M95Ltr7FcMNgDrNnS","aQjY3RHAbbYYbJAHQ"],"keywords":["algorithms","child","data mining","electronic health records","humans","hypertension","pulmonary","phenotype","predictive value of tests","registries","retrospective studies","sensitivity and specificity","united states","bioinformatics","computer-based model","pediatrics","pulmonary hypertension","registry"],"search_terms":["computable","phenotype","improves","cohort","ascertainment","pediatric","pulmonary","hypertension","registry","geva","gronsbell","cai","cai","murphy","lyons","heinz","natter","patibandla","bickel","mullen","mandl","pediatric pulmonary hypertension network","national heart","investigators"],"title":"A Computable Phenotype Improves Cohort Ascertainment in a Pediatric Pulmonary Hypertension Registry","year":2017}