@inproceedings{15f4cacf00714d7c8f0a4f6fc17a0da6,
title = "Analyzing historical diagnosis code data from NIH N3C and RECOVER Programs using deep learning to determine risk factors for Long Covid",
abstract = "Post-acute sequelae of SARS-CoV-2 infection (PASC) or Long COVID is an emerging medical condition that has been observed in several patients with a positive diagnosis for COVID-19. Historical Electronic Health Records (EHR) like diagnosis codes, lab results and clinical notes have been analyzed using deep learning and have been used to predict future clinical events. In this paper, we propose an interpretable deep learning approach to analyze historical diagnosis code data from the National COVID Cohort Collective (N3C)1 to find the risk factors contributing to developing Long COVID. Using our deep learning approach, we are able to predict if a patient is suffering from Long COVID from a temporally ordered list of diagnosis codes up to 45 days post the first COVID positive test or diagnosis for each patient, with an accuracy of 70.48%. We are then able to examine the trained model using Gradient-weighted Class Activation Mapping (GradCAM) to give each input diagnoses a score. The highest scored diagnosis were deemed to be the most important for making the correct prediction for a patient. We also propose a way to summarize these top diagnoses for each patient in our cohort and look at their temporal trends to determine which codes contribute towards a positive Long COVID diagnosis.",
keywords = "COVID-19, deep learning, EHR, GradCAM",
author = "Saurav Sengupta and Johanna Loomba and Suchetha Sharma and Brown, {Donald E.} and Lorna Thorpe and Haendel, {Melissa A.} and Chute, {Christopher G.} and Stephanie Hong",
note = "Funding Information: FUNDING STATEMENT This research was funded by the National Institutes of Health (NIH) Agreement OT2HL161847-01. The views and conclusions contained in this document are those of the authors and should not be interpreted as representing the official policies, either expressed or implied, of the NIH. All authors are funded under this mechanism. Also funded by the NIH award UL1TR003015 for the integrated Translational Health Research Institute of Virginia. Publisher Copyright: {\textcopyright} 2022 IEEE.; 2022 IEEE International Conference on Bioinformatics and Biomedicine, BIBM 2022 ; Conference date: 06-12-2022 Through 08-12-2022",
year = "2022",
doi = "10.1109/BIBM55620.2022.9994851",
language = "English (US)",
series = "Proceedings - 2022 IEEE International Conference on Bioinformatics and Biomedicine, BIBM 2022",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "2797--2802",
editor = "Donald Adjeroh and Qi Long and Xinghua Shi and Fei Guo and Xiaohua Hu and Srinivas Aluru and Giri Narasimhan and Jianxin Wang and Mingon Kang and Mondal, {Ananda M.} and Jin Liu",
booktitle = "Proceedings - 2022 IEEE International Conference on Bioinformatics and Biomedicine, BIBM 2022",
}