@inproceedings{f976379f898f44af815c8fab0f81c8c9,
title = "NLP-Assisted Pipeline for COVID-19 Core Outcome Set Identification Using ClinicalTrials.gov",
abstract = "Core outcome sets (COS) are necessary to ensure the systematic collection, metadata analysis and sharing the information across studies. However, development of an area-specific clinical research is costly and time consuming. ClinicalTrials.gov, as a public repository, provides access to a vast collection of clinical trials and their characteristics such as primary outcomes. With the growing number of COVID-19 clinical trials, identifying COSs from outcomes of such trials is crucial. This paper introduces a semi-automatic pipeline that can efficiently identify, aggregate and rank the COS from the primary outcomes of COVID-19 clinical trials. Using Natural language processing (NLP) techniques, our proposed pipeline successfully downloads and processes 5090 trials from all over the world and identifies COVID-19-specific outcomes that appeared in more than 1% of the trials. The top-of-the-list outcomes identified by the pipeline are mortality due to COVID-19, COVID-19 infection rate and COVID-19 symptoms.",
keywords = "COVID-19, Core outcome set, Natural language processing (NLP)",
author = "Fatemeh Shah-Mohammadi and Irena Parvanova and Joseph Finkelstein",
note = "Publisher Copyright: {\textcopyright} 2022 International Medical Informatics Association (IMIA) and IOS Press.; 18th World Congress on Medical and Health Informatics: One World, One Health - Global Partnership for Digital Innovation, MEDINFO 2021 ; Conference date: 02-10-2021 Through 04-10-2021",
year = "2022",
month = jun,
day = "6",
doi = "10.3233/SHTI220152",
language = "English",
series = "Studies in Health Technology and Informatics",
publisher = "IOS Press BV",
pages = "622--626",
editor = "Paula Otero and Philip Scott and Martin, {Susan Z.} and Elaine Huesing",
booktitle = "MEDINFO 2021",
address = "Netherlands",
}