@article{5cfc3de973a1473795973fa2b06aa313,
title = "MedML: Fusing Medical Knowledge and Machine Learning Models for Early Pediatric COVID-19 Hospitalization and Severity Prediction",
abstract = "The COVID-19 pandemic has caused devastating economic and social disruption. This has led to a nationwide call for models to predict hospitalization and severe illness in patients with COVID-19 to inform the distribution of limited healthcare resources. To address this challenge, we propose a machine learning model, MedML, to conduct the hospitalization and severity prediction for the pediatric population using electronic health records. MedML extracts the most predictive features based on medical knowledge and propensity scores from over 6 million medical concepts and incorporates the inter-feature relationships in medical knowledge graphs via graph neural networks. We evaluate MedML on the National Cohort Collaborative (N3C) dataset. MedML achieves up to a 7% higher AUROC and 14% higher AUPRC compared to the best baseline machine learning models. MedML is a new machine learnig framework to incorporate clinical domain knowledge and is more predictive and explainable than current data-driven methods.",
keywords = "Artificial intelligence, Artificial intelligence applications, Pediatrics, Respiratory medicine",
author = "{N3C consortium} and Junyi Gao and Chaoqi Yang and Joerg Heintz and Scott Barrows and Elise Albers and Mary Stapel and Sara Warfield and Adam Cross and Jimeng Sun",
note = "Funding Information: This work was supported by NCATS U24 TR002306 , NSF award SCH-2014438 , PPoSS 2028839 , IIS-1838042 , NIH award R01 1R01NS107291-01 . We acknowledge support from an ARCHES grant provided by The University of Illinois and OSF HealthCare . This project has been funded by the Jump ARCHES endowment through the Health Care Engineering Systems Center . The analysis described in this work was conducted in support from the Department of Health and Human Services , Office of the Assistant Secretary for Preparedness and Response, Biomedical Advanced Research and Development Authority 2021 Pediatric COVID-19 Data Challenge. The content is solely the responsibility of the authors and does not necessarily represent the official views of the N3C Program, the NIH or other funders. The analyses described in this publication were conducted with data or tools accessed through the NCATS N3C Data Enclave ( National COVID Cohort Collaborative, 2022b ) and N3C Attribution & Publication Policy v 1.2-2020-08-25b. The N3C data transfer to NCATS is performed under a Johns Hopkins University Reliance Protocol # IRB00249128 or individual site agreements with NIH. In addition, access to N3C Data Enclave resources does not imply endorsement of the research project and/or results by NIH or NCATS. This research was possible because of the patients whose information is included within the data and the organizations ( National COVID Cohort Collaborative, 2022a ) and scientists who have contributed to the ongoing development of this community resource ( Haendel et al., 2021 ). We gratefully acknowledge the following core contributors to N3C: Anita Walden, Leonie Misquitta, Joni L. Rutter, Kenneth R. Gersing, Penny Wung Burgoon, Samuel Bozzette, Mariam Deacy, Christopher Dillon, Rebecca Erwin-Cohen, Nicole Garbarini, Valery Gordon, Michael G. Kurilla, Emily Carlson Marti, Sam G. Michael, Lili Portilla, Clare Schmitt, Meredith Temple-O'Connor, David A. Eichmann, Warren A. Kibbe, Hongfang Liu, Philip R.O. Payne, Emily R. Pfaff, Peter N. Robinson, Joel H. Saltz, Heidi Spratt, Justin Starren, Christine Suver, Adam B. Wilcox, Andrew E. Williams, Chunlei Wu, Davera Gabriel, Stephanie S. Hong, Kristin Kostka, Harold P. Lehmann, Michele Morris, Matvey B. Palchuk, Xiaohan Tanner Zhang, Richard L. Zhu, Benjamin Amor, Mark M. Bissell, Marshall Clark, Andrew T. Girvin, Stephanie S. Hong, Kristin Kostka, Adam M. Lee, Robert T. Miller, Michele Morris, Matvey B. Palchuk, Kellie M. Walters, Will Cooper, Patricia A. Francis, Rafael Fuentes, Alexis Graves, Julie A. McMurry, Shawn T. O'Neil, Usman Sheikh, Elizabeth Zampino, Katie Rebecca Bradwell, Andrew T. Girvin, Amin Manna, Nabeel Qureshi, Richard Moffitt, Christine Suver, Julie A. McMurry, Carolyn Bramante, Jeremy Richard Harper, Wenndy Hernandez, Farrukh M Koraishy, Amit Saha, Satyanarayana Vedula, Johanna Loomba, Andrea Zhou, Steve Johnson, Evan French, Alfred (Jerrod) Anzalone, Umit Topaloglu, Amy Olex, Hythem Sidkey. Details of contributions available at covid.cd2h.org/acknowledgments. We acknowledge the following institutions whose data is released or pending: Publisher Copyright: {\textcopyright} 2022 The Author(s)",
year = "2022",
month = sep,
day = "16",
doi = "10.1016/j.isci.2022.104970",
language = "English (US)",
volume = "25",
pages = "104970",
journal = "iScience",
issn = "2589-0042",
publisher = "Elsevier Inc.",
number = "9",
}