﻿<?xml version="1.0" encoding="UTF-8"?>
<records>
  <record>
    <language>eng</language>
    <publisher>Science and Education Publishing</publisher>
    <journalTitle>American Journal of Epidemiology and Infectious Disease</journalTitle>
    <eissn>2333-1275</eissn>
    <publicationDate>2025-05-08</publicationDate>
    <volume>13</volume>
    <issue>1</issue>
    <startPage>10</startPage>
    <endPage>18</endPage>
    <doi>10.12691/ajeid-13-1-2</doi>
    <publisherRecordId>AJEID20251312</publisherRecordId>
    <documentType>article</documentType>
    <title language="eng">Machine Learning Modeling to Predict COVID seropositivity; AI for Pandemic Preparedness</title>
    <authors>
      <author>
        <name>Apeksha Mewani</name>
        <email>abcdef@gmail.com</email>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>Vincent Jones II</name>
        <affiliationId>2</affiliationId>
      </author>
      <author>
        <name>Alejandro Sanchez</name>
        <affiliationId>3</affiliationId>
      </author>
    </authors>
    <affiliationsList>
      <affiliationName affiliationId="1">Department of Health Equity, Administration, and Technology, Lehman College, CUNY</affiliationName>
      <affiliationName affiliationId="2">Department of Health and Human Performance, York College, CUNY, USA</affiliationName>
      <affiliationName affiliationId="3">School of Medicine, American University of the Caribbean, St. Marteen</affiliationName>
    </affiliationsList>
    <abstract language="eng">This study determines the best machine learning (ML) models to predict the most accurate results in COVID-19 seropositivity using existing data. The study used the New York City Community Health Survey (NYC CHS) 2020 dataset for the analysis, and a predictive modeling approach to develop and select an optimal ML model that would accurately predict COVID-19 seropositivity from various ML algorithms. Thus, the LightGBM was found to have the highest Area Under the Curve and overall test metrics including accuracy, precision, and recall, and was therefore selected as the best-performing machine learning model.</abstract>
    <fullTextUrl format="pdf">https://pubs.sciepub.com/ajeid/13/1/2/ajeid-13-1-2.pdf</fullTextUrl>
    <keywords language="eng">
      <keyword>COVID-19</keyword>
      <keyword>Machine learning</keyword>
      <keyword>emergency preparedness</keyword>
      <keyword>predictive modeling</keyword>
      <keyword>seropositivity</keyword>
      <keyword>health education</keyword>
    </keywords>
  </record>
</records>