<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i9e29413</article-id>
      <article-id pub-id-type="pmid">34517338</article-id>
      <article-id pub-id-type="doi">10.2196/29413</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Tracking Self-reported Symptoms and Medical Conditions on Social Media During the COVID-19 Pandemic: Infodemiological Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sanchez</surname>
            <given-names>Travis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Guntuku</surname>
            <given-names>Sharath</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Guntuku</surname>
            <given-names>Sharath Chandra</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Han</surname>
            <given-names>Jin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Ding</surname>
            <given-names>Qinglan</given-names>
          </name>
          <degrees>MBBS, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7431-0288</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Massey</surname>
            <given-names>Daisy</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9922-7808</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Chenxi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8624-4652</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Grady</surname>
            <given-names>Connor B</given-names>
          </name>
          <degrees>MPH</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8407-846X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Yuan</given-names>
          </name>
          <degrees>ScD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5264-2169</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Cohen</surname>
            <given-names>Alina</given-names>
          </name>
          <degrees>MSc, MBA</degrees>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4250-3111</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Matzner</surname>
            <given-names>Pini</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1181-7708</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Mahajan</surname>
            <given-names>Shiwani</given-names>
          </name>
          <degrees>MBBS, MHS</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5617-489X</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Caraballo</surname>
            <given-names>César</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4557-9437</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Kumar</surname>
            <given-names>Navin</given-names>
          </name>
          <degrees>MPhil</degrees>
          <xref rid="aff06" ref-type="aff">6</xref>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4502-069X</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Xue</surname>
            <given-names>Yuchen</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff08" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3658-0505</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Dreyer</surname>
            <given-names>Rachel</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2861-1383</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Roy</surname>
            <given-names>Brita</given-names>
          </name>
          <degrees>MD, MPH, MHS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3782-0104</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Krumholz</surname>
            <given-names>Harlan M</given-names>
          </name>
          <degrees>MD, SM</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <address>
            <institution>Center for Outcomes Research and Evaluation</institution>
            <institution>Yale New Haven Hospital</institution>
            <addr-line>1 Church Street, Suite 200</addr-line>
            <addr-line>New Haven, CT, 06510</addr-line>
            <country>United States</country>
            <fax>1 203 764 5653</fax>
            <phone>1 203 764 5885</phone>
            <email>harlan.krumholz@yale.edu</email>
          </address>
          <xref rid="aff04" ref-type="aff">4</xref>
          <xref rid="aff11" ref-type="aff">11</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2046-127X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>Center for Outcomes Research and Evaluation</institution>
        <institution>Yale New Haven Hospital</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>College of Health and Human Sciences</institution>
        <institution>Purdue University</institution>
        <addr-line>West Lafayette, IN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Department of Chronic Disease Epidemiology</institution>
        <institution>Yale School of Public Health</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>Section of Cardiovascular Medicine</institution>
        <institution>Department of Internal Medicine</institution>
        <institution>Yale School of Medicine</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>Skai</institution>
        <addr-line>Tel-Aviv</addr-line>
        <country>Israel</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>Department of Sociology</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Institute for Network Science</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Foundation for a Smoke-Free World</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Department of Emergency Medicine</institution>
        <institution>Yale School of Medicine</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Department of Medicine</institution>
        <institution>Yale School of Medicine</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff11">
        <label>11</label>
        <institution>Department of Health Policy and Management</institution>
        <institution>Yale School of Public Health</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Harlan M Krumholz <email>harlan.krumholz@yale.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>28</day>
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <volume>7</volume>
      <issue>9</issue>
      <elocation-id>e29413</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>12</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>6</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>26</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Qinglan Ding, Daisy Massey, Chenxi Huang, Connor B Grady, Yuan Lu, Alina Cohen, Pini Matzner, Shiwani Mahajan, César Caraballo, Navin Kumar, Yuchen Xue, Rachel Dreyer, Brita Roy, Harlan M Krumholz. Originally published in JMIR Public Health and Surveillance (https://publichealth.jmir.org), 28.09.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on https://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://publichealth.jmir.org/2021/9/e29413" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Harnessing health-related data posted on social media in real time can offer insights into how the pandemic impacts the mental health and general well-being of individuals and populations over time.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to obtain information on symptoms and medical conditions self-reported by non-Twitter social media users during the COVID-19 pandemic, to determine how discussion of these symptoms and medical conditions changed over time, and to identify correlations between the frequency of posts on the 5 most commonly mentioned symptoms and daily COVID-19 statistics (new cases, new deaths, new active cases, and new recovered cases) in the United States.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used natural language processing (NLP) algorithms to identify symptom- and medical condition–related topics being discussed on social media between June 14 and December 13, 2020. The sample posts were geotagged by NetBase, a third-party data provider. We calculated the positive predictive value and sensitivity to validate the classification of posts. We also assessed the frequency of health-related discussions on social media over time during the study period, and used Pearson correlation coefficients to identify statistically significant correlations between the frequency of the 5 most commonly mentioned symptoms and fluctuation of daily US COVID-19 statistics.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Within a total of 9,807,813 posts (nearly 70% were sourced from the United States), we identified a discussion of 120 symptom-related topics and 1542 medical condition–related topics. Our classification of the health-related posts had a positive predictive value of over 80% and an average classification rate of 92% sensitivity. The 5 most commonly mentioned symptoms on social media during the study period were anxiety (in 201,303 posts or 12.2% of the total posts mentioning symptoms), generalized pain (189,673, 11.5%), weight loss (95,793, 5.8%), fatigue (91,252, 5.5%), and coughing (86,235, 5.2%). The 5 most discussed medical conditions were COVID-19 (in 5,420,276 posts or 66.4% of the total posts mentioning medical conditions), unspecified infectious disease (469,356, 5.8%), influenza (270,166, 3.3%), unspecified disorders of the central nervous system (253,407, 3.1%), and depression (151,752, 1.9%). Changes in the frequency of posts on anxiety, generalized pain, and weight loss were significantly but negatively correlated with daily new COVID-19 cases in the United States (r=-0.49, r=-0.46, and r=-0.39, respectively; <italic>P</italic>&#60;.05). The frequency of posts on anxiety, generalized pain, weight loss, and fatigue, as well as changes in the frequency of posts on fatigue, correlated positively and significantly with daily changes in both new deaths and new active cases in the United States (r range 0.39-0.48; <italic>P</italic>&#60;.05).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>COVID-19 and symptoms of anxiety were the 2 most commonly discussed health-related topics on social media from June 14 to December 13, 2020. Real-time monitoring of social media posts on symptoms and medical conditions may help assess the population’s mental health status and enhance public health surveillance for infectious disease.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>health conditions</kwd>
        <kwd>symptoms</kwd>
        <kwd>mental health</kwd>
        <kwd>social media</kwd>
        <kwd>infoveillance</kwd>
        <kwd>public health surveillance</kwd>
        <kwd>COVID-19</kwd>
        <kwd>pandemic</kwd>
        <kwd>natural language processing</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The COVID-19 pandemic continues to spread worldwide, with more than 229 million confirmed cases and approximately 4.7 million deaths in 188 countries as of September 21, 2021 [<xref ref-type="bibr" rid="ref1">1</xref>]. As individuals are being encouraged to telecommute and self-quarantine, social media usage has surged by over 40%, emerging as a powerful tool for facilitating communication and disseminating information in a timely manner [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. The general public and health care professionals use social media platforms for health surveillance; to share their feelings, opinions, knowledge, and experiences in relation to the COVID-19 pandemic; and interact with others who share similar characteristics or interests [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. A growing number of people also use social media to seek and share health information that might otherwise be “invisible” to clinicians and medical researchers (eg, self-diagnosis and self-treated symptoms with over-the-counter medications) [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Harnessing publicly available health-related data posted on social media in real time has the potential to offer insights into how the pandemic impacts the mental health and general well-being of individuals and populations over time [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Although prior studies have demonstrated that social media discussions can influence health-related beliefs and behaviors, more studies are needed to understand how social media plays a role during the pandemic [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Since the emergence of the COVID-19 pandemic, an estimated 41% of US adults have delayed or avoided urgent and routine medical care during the pandemic owing to concerns about COVID-19 [<xref ref-type="bibr" rid="ref13">13</xref>]. Real-time information regarding self-reported general health status at a population level is lacking. Most literature in this area of research has been focused particularly on mental health or COVID-19 symptoms, with Twitter frequently being utilized as the sole data source [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. There was limited information regarding health-related discussions from social media sites other than Twitter. Furthermore, the predictive value of posts on COVID-19 symptoms or related medical conditions on social media sites other than Twitter has not yet been ascertained [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Extracting and analyzing health-related data from multiple social media sources might provide novel ways of measuring the health status and the full spectrum of symptoms and illness of the population in real time [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>As such, we created a dashboard to extract and monitor posts mentioning symptoms and medical conditions from social media sites other than Twitter over the course of the COVID-19 pandemic. In this study, we sought to answer the following questions: (1) what symptoms and medical conditions were people discussing on social media platforms other than Twitter during the COVID-19 pandemic? (2) How have discussions of symptoms and medical conditions on social media changed over a 6-month period during the pandemic? (3) Were daily fluctuations in health-related social media conversations associated with daily changes in COVID-19 statistics (new cases, new deaths, new active cases, and new recovered cases) in the United States?</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <p>We included English-language social networks and forums worldwide, such as Facebook public pages, Reddit, 4Chan, and the comments sections of news sites such as ABC News [<xref ref-type="bibr" rid="ref23">23</xref>]. We defined forums as thread-based message boards and topic-specific pages [<xref ref-type="bibr" rid="ref24">24</xref>]. We chose these sources to provide diversity because they have been studied less than Twitter in this area [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Additionally, the user base profile of our sources appeared to be more representative of the demographic profile of the broader US population than Twitter. While both Twitter and Reddit were popular among US adults aged ≤30 years, those who lived in urban areas, and were male [<xref ref-type="bibr" rid="ref27">27</xref>], Facebook appeared to be more popular among female users and US adults older than 30 years [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <p>Furthermore, even though the affordances of our sources overlap with those of Twitter, Reddit users have more anonymity as they do not need to register an account to access the majority of the content, thus allowing for greater participation [<xref ref-type="bibr" rid="ref25">25</xref>]. Lastly, forums such as Reddit allow lengthy submissions and are usually topic-specific, which grants opportunities to cover the sensitive topics of our study (eg, mental health disorders and symptoms), which may not typically be discussed on social media [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. The greater length of the comments (eg, 40 words per comment for Reddit vs &#60;15 words in tweets, on average) and the less frequent use of hashtags associated with forums also make it possible to apply more complex natural language processing (NLP) algorithms to classify sample posts more accurately [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>We partnered with Signals Analytics, an advanced analytics company, to obtain access to target data sources from a third-party data vendor (NetBase) and to conduct the analysis [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. In order to geotag posts, NetBase used a combination of geotagged social media messages, author profiles, and each country’s unique website domain suffix (eg, “.ca” for Canada). All the acquired data were then deidentified by NetBase and transferred to Signals Analytics for analysis.</p>
        <p>We also gathered data on COVID-19 cases from the COVID-19 dashboard developed by the Center for Systems Science and Engineering at Johns Hopkins University, which provides the most comprehensive and up-to-date information on COVID-19 trends [<xref ref-type="bibr" rid="ref1">1</xref>]. Using the RapidAPI application programming interface (API) [<xref ref-type="bibr" rid="ref31">31</xref>], we updated the COVID-19 statistics (daily new cases or incidence) on a daily basis.</p>
        <p>In this study, all personal identifying information such as usernames, emails, and IP addresses was removed before analysis. The study was exempt from institutional review board review at Yale University as it used publicly available, anonymized data.</p>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>For the analysis of data on symptoms and medical conditions being discussed on social media platforms between June 14 (when many countries began to lift major COVID-19 restrictions) and December 13, 2020 (when the first shipment of the COVID-19 vaccine arrived in the United States), we began by applying NLP algorithms to process social media posts collected from data sources during the study period, and then classified these posts in accordance with symptoms and medical conditions being mentioned.</p>
        <p>To accomplish this, NetBase ran a daily scheduled data extraction query that we designed for the study on over 300 million web-based data sources (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Additionally, we performed the following filtering steps to include posts relevant to our research questions. First, NLP algorithms were run, and advertisements and posts on sites for pornography were removed (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Next, we applied a taxonomy of over 3000 health-related topics to identify key words, phrases, and statements mentioning symptoms and medical conditions (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Social media posts that did not contain any of the taxonomy terms or symptoms and medical conditions as keywords were then deleted. Lastly, we removed redundant posts, blog posts, and news articles to ensure that the analysis was based on unique posts from social networks, forums, and comments only.</p>
        <p>To evaluate the performance of the NLP algorithms and taxonomy classifications of symptoms and medical conditions, we applied the taxonomy to 4 sets of independent 100-post samples and calculated the positive predictive value and sensitivity of the classification (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The algorithms used to identify symptoms and medical conditions topics in our study have been previously validated using real-world data to assess the public’s behaviors and perceptions toward COVID-19 [<xref ref-type="bibr" rid="ref32">32</xref>]. Our study methodology has also been used to provide insights into the characterization and prediction of e-cigarette or vaping product use–associated lung injury outbreaks, known as the EVALI study [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
        <p>Our taxonomy was organized into three levels: categories, subcategories, and topics. Symptoms and medical conditions were the 2 main categories in the taxonomy (<xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The symptoms category included 98 non–COVID-19 topics (symptoms), which were grouped into 7 subcategories based on the affected organ or systems (eg, cardiovascular or respiratory systems). A list of 22 COVID-19–related topics (symptoms) was included as a separate symptom subcategory. The list of COVID-19–related symptoms was defined as outlined by the Centers for Disease Control and Prevention (CDC) on December 22, 2020 [<xref ref-type="bibr" rid="ref34">34</xref>]. Because our algorithms captured all posts that mentioned any of the listed COVID-19 symptoms in the COVID-19–related symptom subcategory, the included posts may not necessarily represent discussions of symptoms experienced by patients with COVID-19. The medical condition category included 2200 topics (medical diagnoses), which were grouped into 10 subcategories. Categories, subcategories, and topics in the taxonomy were not mutually exclusive; each post could be assigned to multiple categories, subcategories, or topics.</p>
        <p>We also created content filters to retain posts mentioning COVID-19 for further analysis. We applied 2 filters, COVID-19 disease status and COVID-19 diagnostic methods, to identify discussions on COVID-19 disease status (tested positive or negative, symptomatic or asymptomatic, recovered, and exposed to a confirmed patient) and diagnostic methods (COVID-19 testing, self-diagnosis, and remote diagnosis). These more restrictive searches were conducted by activating the 2 additional filters using the NLP algorithm, and the resulting posts from that search may not indicate the author’s COVID-19 status.</p>
        <p>To explore how the discussion of symptoms and medical conditions on social media changed from June 14 to December 13, 2020, we determined the number of posts that included a discussion of each symptom and medical condition over time using NLP classification (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). To assess whether the frequency of symptom posts was associated with daily COVID-19 statistics, we performed Pearson correlation analysis to determine correlations among the top 5 most discussed symptoms and daily COVID-19 statistics (new cases, new deaths, new active cases [total cases minus recovered and those who have died], and new recovered cases). Additionally, we calculated Pearson correlation coefficients between frequency changes in each of the 5 symptoms and daily fluctuation in any COVID-19 statistic. A 2-tailed <italic>P</italic> value of &#60;.05 was used to indicate statistical significance. Both posts and COVID-19 statistics used in these analyses were restricted to the United States.</p>
        <p>Additionally, we compared the trends of the 5 most frequently mentioned symptoms and medical conditions from June 14 to August 31, 2020 (when the United States crossed the 6 million COVID-19 cases mark), to the trends observed from September 1 to December 13, 2020, by measuring the percent change between the 2 time periods in the number of posts including a discussion of each topic. We compared the 2 time periods to reveal changes in health-related conversations on social media at different stages of the pandemic, as prior literature focused primarily on the early stage of the pandemic (before June 2020). Our approach was also designed to contribute to a better understanding of the impact of COVID-19 on the public’s perceptions and attitudes toward different symptoms, medical conditions, and health care–seeking behaviors.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>After social media posts were collected from sources, preprocessed, and classified in accordance with the taxonomy by NLP algorithms, our final sample included a total of 9,807,813 posts between June 14 and December 13, 2020, which mentioned at least 1 of the 120 symptoms or 1542 medical condition topics in our taxonomy (<xref ref-type="table" rid="table1">Table 1</xref>). Our taxonomy classification in the independent samples of 100 posts resulted in a positive predictive value of over 80% and an average classification rate of 92% sensitivity. Furthermore, based on indirect geotagging information provided by NetBase, approximately 70% of all posts collected by the search query were from the United States. The most prevalent symptom subcategory was “neuropsychological symptoms” (568,662/1,649,547, 34.5%), followed by the COVID-19–related symptoms subcategory (501,178/1,649,547, 30.4%). The most prevalent medical condition subcategory was “infectious disease” (6,052,068/8,158,266, 74.2%), followed by the subcategory of “psychiatric or mental health disorders” (484,505/8,158,266, 6.0%) (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
      <p>Irrespective of subcategories classification, the 5 most commonly mentioned symptom topics were anxiety (201,303, 12.2%, of the total posts mentioning symptoms), generalized pain (189,673, 11.5%), weight loss (95,793, 5.8%), fatigue (91,252, 5.5%), and coughing (86,235, 5.2%), accounting for 40.2% of all symptom posts combined (<xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The 5 most discussed medical condition topics were COVID-19 (5,420,276, 66.4%, of the total posts mentioning medical conditions), unspecified infectious disease (469,356, 5.8%), influenza (270,166, 3.3%), unspecified disorders of the central nervous system (CNS) (253,407, 3.1%), and depression (151,752, 1.9%), and together they accounted for 80.5% of all medical conditions discussed on social media during the study period (<xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Number of posts on symptoms and medical conditions mentioned on social media platforms by taxonomy topic (June 14 to December 13, 2020; N=9,807,813).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="470"/>
          <col width="250"/>
          <col width="250"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Relevant taxonomy categories and subcategories (number of topics)</td>
              <td>Number of posts with symptoms or medical conditions</td>
              <td>Percentage of all posts on symptoms or all medical conditions (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="4">
                <bold>Symptoms (n=1,649,547)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Neuropsychological symptoms (17)</td>
              <td>568,662</td>
              <td>34.47</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>COVID-19–related symptoms<sup>a</sup> (22)</td>
              <td>501,178</td>
              <td>30.38</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Respiratory symptoms (7)</td>
              <td>128,134</td>
              <td>7.77</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Gastrointestinal symptoms (13)</td>
              <td>120,621</td>
              <td>7.31</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Dermal symptoms (16)</td>
              <td>99,453</td>
              <td>6.03</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Cardiovascular disease symptoms (4)</td>
              <td>34,014</td>
              <td>2.06</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Musculoskeletal symptoms (7)</td>
              <td>33,604</td>
              <td>2.04</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Other symptoms (34)</td>
              <td>163,881</td>
              <td>9.93</td>
            </tr>
            <tr valign="top">
              <td colspan="4">
                <bold>Medical conditions (n=8,158,266)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Infectious disease (80)</td>
              <td>6,052,068</td>
              <td>74.18</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Psychiatric or mental health disorders (21)</td>
              <td>484,505</td>
              <td>5.94</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Neurovascular and cardiovascular diseases (63)</td>
              <td>465,675</td>
              <td>5.71</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Respiratory disorders (17)</td>
              <td>165,404</td>
              <td>2.03</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Hematological and oncological disorders (127)</td>
              <td>164,159</td>
              <td>2.01</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Other disorders (1234)</td>
              <td>828,786</td>
              <td>10.13</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>COVID-19–related symptoms were based on symptoms of COVID-19 (n=22) updated by the Centers for Disease Control and Prevention on December 22, 2020, which were as follows: runny nose, change in sense of taste, change in sense of smell, chills, bluish lips/face, inability to stay awake, fatigue, headache, sore throat, abdominal pain, vomiting, muscle pain/spasms, drowsiness, nausea, body aches, chest pain, itching/swelling, fever, confusional state, diarrhea, coughing, and difficulty breathing.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Frequency of the top 5 most discussed symptoms and medical conditions on social media by taxonomy topic (June 14 to December 13, 2020; N=9,807,813).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="470"/>
          <col width="250"/>
          <col width="250"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Relevant taxonomy categories and topics</td>
              <td>Number of posts with topics related to symptoms or medical conditions</td>
              <td>Percentage of posts on all topics related to symptoms or all medical conditions (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="4">
                <bold>Symptoms (n=1,649,547)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Anxiety</td>
              <td>201,303</td>
              <td>12.20</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Generalized pain</td>
              <td>189,673</td>
              <td>11.49</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Weight loss</td>
              <td>95,793</td>
              <td>5.81</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Fatigue</td>
              <td>91,252</td>
              <td>5.53</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Coughing</td>
              <td>86,235</td>
              <td>5.23</td>
            </tr>
            <tr valign="top">
              <td colspan="4">
                <bold>Medical conditions (n=8,158,266)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>COVID-19</td>
              <td>5,420,276</td>
              <td>66.44</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Unspecified infectious disease</td>
              <td>469,356</td>
              <td>5.75</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Influenza</td>
              <td>270,166</td>
              <td>3.31</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Unspecified CNS<sup>a</sup> disorders</td>
              <td>253,407</td>
              <td>3.11</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Depression</td>
              <td>151,752</td>
              <td>1.86</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>CNS: central nervous system.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>Within the COVID-19–related symptoms subcategory, fatigue (91,208, 32.9%) and coughing (86,222, 31.1%) were the most discussed COVID-19–related symptom topics (<xref ref-type="table" rid="table3">Table 3</xref>). Bluish lips/face (1019, 0.4%) and inability to stay awake (486, 0.2%) were the least commonly discussed COVID-19 symptoms.</p>
      <p>After applying the COVID-19 disease status filter to all posts mentioning the top 5 most frequently mentioned symptoms and medical conditions, we noticed that within the posts classified with the medical condition of COVID-19, 62.9% had also discussed testing positive, and 9.1% of the discussions were related to asymptomatic COVID-19 (Table S2, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Applying the COVID-19 diagnostic method filter revealed that the most popular COVID-19 diagnostic methods discussed were COVID-19 tests regardless of the symptom or medical condition subcategory (Table S2, <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <p>The pattern of changes in top 5 commonly mentioned posts of medical conditions or symptoms and the fluctuation of daily new COVID-19 cases in the United States are displayed in <xref rid="figure1" ref-type="fig">Figures 1</xref> and <xref rid="figure2" ref-type="fig">2</xref>. We noticed a significant increase in daily frequency of posts mentioning the top 5 symptom- and medical condition–related topics in October 2020 and a decrease in late November-December 2020 (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Statistical analysis showed that the frequency of symptom posts that was strongly associated with daily new cases included changes in anxiety (r=–0.49; <italic>P</italic>=.009), changes in generalized pain (r=–0.46; <italic>P</italic>=.01), and changes in weight loss (r=–0.39; <italic>P</italic>=.04) (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The frequency of symptom-related posts that strongly correlated with daily changes in both new deaths and new active cases included anxiety (r=0.49, <italic>P</italic>=.008; r=0.59, <italic>P</italic>=.002, respectively); generalized pain (r=0.48, <italic>P</italic>=.01; r=0.59, <italic>P</italic>=.001, respectively); weight loss (r=0.39, <italic>P</italic>=.04; r=0.48, <italic>P</italic>=.01, respectively); fatigue (r=0.48, <italic>P</italic>=.01; r=0.53, <italic>P</italic>=.049, respectively); and changes in fatigue (r=0.09, <italic>P</italic>=.001; r=0.48, <italic>P</italic>=.009, respectively) (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <p>Correlations between the frequency of the 4 most commonly discussed symptoms and daily recovered cases were significant, and their Pearson correlation coefficients were –0.43 for anxiety, –0.44 for generalized pain, –0.55 for weight loss, and –0.51 for coughing, which indicated a negative and moderate correlation among them (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <p>When examining changes in the frequency of the top 5 most commonly mentioned symptom topic discussions over the 6-month study period, we noted a 24% increase in symptom posts mentioning anxiety, generalized pain, and fatigue during September 1-December 13, 2020 (vs June 14-August 31, 2020) (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Compared to June 14-August 31, 2020, posts mentioning the medical condition–related topics influenza, unspecified CNS disorders, and depression increased by more than 27% during September 1-December 13, 2020 (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). In terms of changes within the COVID-19–related symptoms subcategory, social media posts mentioning runny nose and change in the sense of taste and smell increased over 64%, while posts mentioning difficulty breathing decreased 1.5% during September 1-December 13, 2020 (vs June 14-August 31, 2020) (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Comparing changes in the number of posts on COVID-19 symptoms between June 14 and August 31, 2020, with those in September 1 to December 13, 2020 (N=277,401).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="200"/>
          <col width="200"/>
          <col width="200"/>
          <col width="200"/>
          <col width="200"/>
          <thead>
            <tr valign="top">
              <td>COVID-19–related symptoms per the Centers for Disease Control and Prevention’s definition<sup>a</sup></td>
              <td>Posts mentioning this COVID-19 symptom, n (%)</td>
              <td>Posts during June 14-August 31, 2020, n</td>
              <td>Posts during September 1-December 13, 2020, n</td>
              <td>Changes in the number of posts, %</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Fatigue</td>
              <td>91,208 (32.88)</td>
              <td>36,876</td>
              <td>54,332</td>
              <td>47.33</td>
            </tr>
            <tr valign="top">
              <td>Coughing</td>
              <td>86,222 (31.08)</td>
              <td>41,163</td>
              <td>45,059</td>
              <td>9.46</td>
            </tr>
            <tr valign="top">
              <td>Fever</td>
              <td>59,906 (21.59)</td>
              <td>27,729</td>
              <td>32,177</td>
              <td>16.04</td>
            </tr>
            <tr valign="top">
              <td>Headache</td>
              <td>41,693 (15.02)</td>
              <td>18,052</td>
              <td>23,641</td>
              <td>30.96</td>
            </tr>
            <tr valign="top">
              <td>Vomiting</td>
              <td>39,103 (14.09)</td>
              <td>17,364</td>
              <td>21,739</td>
              <td>25.19</td>
            </tr>
            <tr valign="top">
              <td>Difficulty breathing</td>
              <td>33,589 (12.11)</td>
              <td>16,917</td>
              <td>16,672</td>
              <td>Decreased 1.45</td>
            </tr>
            <tr valign="top">
              <td>Nausea</td>
              <td>29,103 (10.49)</td>
              <td>13,039</td>
              <td>16,064</td>
              <td>23.19</td>
            </tr>
            <tr valign="top">
              <td>Itching/swelling</td>
              <td>28,337 (10.22)</td>
              <td>12,953</td>
              <td>15,384</td>
              <td>18.77</td>
            </tr>
            <tr valign="top">
              <td>Sore throat</td>
              <td>14,694 (5.29)</td>
              <td>6424</td>
              <td>8270</td>
              <td>28.74</td>
            </tr>
            <tr valign="top">
              <td>Diarrhea</td>
              <td>14,140 (5.09)</td>
              <td>6716</td>
              <td>7424</td>
              <td>10.54</td>
            </tr>
            <tr valign="top">
              <td>Chest pain</td>
              <td>9412 (3.39)</td>
              <td>4255</td>
              <td>5157</td>
              <td>21.19</td>
            </tr>
            <tr valign="top">
              <td>Abdominal pain</td>
              <td>9238 (3.33)</td>
              <td>4080</td>
              <td>5158</td>
              <td>26.42</td>
            </tr>
            <tr valign="top">
              <td>Runny nose</td>
              <td>8283 (2.98)</td>
              <td>3029</td>
              <td>5254</td>
              <td>73.46</td>
            </tr>
            <tr valign="top">
              <td>Body aches</td>
              <td>7871 (2.84)</td>
              <td>3540</td>
              <td>4331</td>
              <td>22.34</td>
            </tr>
            <tr valign="top">
              <td>Change in sense of taste</td>
              <td>6510 (2.35)</td>
              <td>2447</td>
              <td>4063</td>
              <td>66.04</td>
            </tr>
            <tr valign="top">
              <td>Muscle pain/spasms</td>
              <td>6321 (2.28)</td>
              <td>2816</td>
              <td>3505</td>
              <td>24.47</td>
            </tr>
            <tr valign="top">
              <td>Change in sense of smell</td>
              <td>6192 (2.23)</td>
              <td>2340</td>
              <td>3852</td>
              <td>64.62</td>
            </tr>
            <tr valign="top">
              <td>Confusional state</td>
              <td>3716 (1.34)</td>
              <td>1737</td>
              <td>1979</td>
              <td>13.93</td>
            </tr>
            <tr valign="top">
              <td>Chills</td>
              <td>2879 (1.04)</td>
              <td>1141</td>
              <td>1738</td>
              <td>52.32</td>
            </tr>
            <tr valign="top">
              <td>Drowsiness</td>
              <td>1256 (0.45)</td>
              <td>560</td>
              <td>696</td>
              <td>24.29</td>
            </tr>
            <tr valign="top">
              <td>Bluish lips/face</td>
              <td>1019 (0.37)</td>
              <td>404</td>
              <td>615</td>
              <td>52.23</td>
            </tr>
            <tr valign="top">
              <td>Inability to stay awake</td>
              <td>486 (0.18)</td>
              <td>195</td>
              <td>291</td>
              <td>49.23</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>The list of COVID-19 symptoms was updated on December 22, 2020, in accordance with the Centers for Disease Control and Prevention’s update. Our algorithms captured all posts mentioning any of these symptoms in the COVID-19 symptom subcategory; consequently, the posts may not necessarily represent patients discussing their own COVID-19 symptoms.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Associations between changes in new daily COVID-19 cases in the United States and the number of medical condition–related posts (June 13-December 13, 2020). (Note: the gray shaded area indicates daily active COVID-19 cases in the United States, while the colored curves show fluctuations in posts mentioning different medical disorders during the study period). CNS: central nervous system.</p>
        </caption>
        <graphic xlink:href="publichealth_v7i9e29413_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Associations between changes in new daily COVID-19 cases in the United States and the number of symptom-related posts (June 13-December 13, 2020). (Note: the gray shaded area indicates daily active COVID-19 cases in the United States, while the colored curves show fluctuations in posts mentioning different symptoms during the study period).</p>
        </caption>
        <graphic xlink:href="publichealth_v7i9e29413_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we collected and analyzed web-based posts from forums and comments on news sites between June 14 and December 13, 2020. We found that a wide variety of symptom and medical condition topics were discussed on non-Twitter social media. While the vast majority of discussions were about COVID-19 infection and COVID-19–related symptoms (as defined by the CDC), neuropsychological symptoms (eg, anxiety) and other medical conditions (eg, infectious diseases and psychiatric disorders) were also frequently mentioned. Additionally, we noticed that changes in the frequency of posts on anxiety, generalized pain, and weight loss were significantly but negatively correlated with daily new COVID-19 cases in the United States, and that the frequency of posts on anxiety, generalized pain, weight loss, fatigue, and the changes in fatigue positively and significantly correlated with daily changes in both new deaths and new active cases in the United States. As COVID-19 cases continued to rise globally, the cumulative volume of posts mentioning anxiety, generalized pain, fatigue, influenza, unspecified CNS disorders, and depression increased from September 1 to December 13, 2020 (compared to June 14 to August 31, 2020).</p>
        <p>Our findings expand on previous observations regarding the mental health effects of the COVID-19 pandemic among social media users by presenting a more complete picture of health-related topics discussed on social media [<xref ref-type="bibr" rid="ref18">18</xref>]. Our results not only confirm the findings from previous studies that showed high levels of anxiety and depression mentioned by social media users during the pandemic [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] but also reveal that the frequency of anxiety and other general health symptom–related posts, including generalized pain, weight loss, and fatigue, was significantly correlated with daily COVID-19 statistics. These data support the idea that social media represents a potentially powerful source of information for health care professionals to draw real-time estimations about population health status [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Understanding health symptom posts commonly associated with COVID-19 statistics may inform public health researchers, clinicians, and policymakers to take timely and appropriate public health and clinical measures accordingly.</p>
        <p>Further, as access to the internet becomes more widely available and with the anonymity of social media, people who face barriers to accessing health care and those who have mental health symptoms may use social media to speak openly about their health experiences and seek help [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Collectively, these results further justify our approach to monitoring symptoms and medical condition posts on social media during the pandemic, and call for further investigation of the possibility of using social media analytics to gain insights into the population’s symptoms (including mental health symptoms, which are difficult to monitor outside of the health system) and health threats, and to enhance public health preparedness.</p>
        <p>As the pandemic progresses, obtaining information on the symptom profile of COVID-19 could help to better diagnose and treat the disease. There has been increasing recognition of the importance of extracting social media information to explore symptom experience and disease progression among patients with COVID-19 [<xref ref-type="bibr" rid="ref38">38</xref>]. Although we did not restrict our analysis to only social media posts mentioning COVID-19 and could not verify the authors’ disease status, the most discussed COVID-19–related symptoms we found (eg, fatigue, cough, fever, headache, and difficulty breathing) were among the most common symptoms reported by patients with COVID-19 in other studies [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>]. Based on information extracted by applying COVID-19 disease status and diagnostic methods filters, we found that nearly 40% of non-Twitter social media users who discussed the top 5 most commonly mentioned symptom topics, such as fatigue and cough, also talked about the topic of having tested positive for COVID-19.</p>
        <p>We also noticed that approximately 15% of these discussions were related to asymptomatic COVID-19. While an in-depth exploration of these posts using qualitative analysis or sentiment analysis is necessary to help verify the users’ COVID-19 disease status, our preliminary data indicate the potential for extracting information from social media to understand the full spectrum of symptoms experienced by patients with COVID-19. Interestingly, we noticed an increase of over 60% in the volume of posts mentioning less common COVID-19 symptoms such as changes in the senses of taste and smell during the second stage of our study period (September 1 to December 13, 2020). This surge may be partly due to improvements in knowledge and awareness of COVID-19 symptoms in the general population as the 2 symptoms were recently added to the COVID-19 symptom lists of the CDC and the World Health Organization (late April 2020 and early May 2020, respectively).</p>
        <p>While there have been fluctuations in the volume of social media posts on a day-to-day basis, there appeared to be seasonal variation in the volume of discussion of symptoms and medical conditions. We noticed that the volume of most health-related discussions increased more from September 1 to December 13, 2020, than from June 14 to August 31, 2020. These changes may have been due to a combination of colder weather in the northern hemisphere and social distancing and limitations on daily life during the pandemic as well as the second wave of COVID-19, resulting in more social media users and more people being restricted indoors [<xref ref-type="bibr" rid="ref42">42</xref>]. Additionally, there were several inflection points in the volume of discussion of symptoms and medical conditions in the last 6 months. These changes appeared to have coincided with major news stories and national events, echoing findings from other studies that showed the potential impact of media coverage on web-based discussions [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. For example, the volume of all 5 commonly mentioned symptoms (anxiety, generalized pain, weight loss, fatigue, and cough) and 2 medical conditions (unspecified CNS disorders and depression) peaked on October 10, 2020, the day on which Hurricane Delta struck Louisiana and nearby states and left 730,000 homes and businesses without power [<xref ref-type="bibr" rid="ref43">43</xref>]. However, our study did not find evidence of an association between changes in the volume of symptom discussion over time and the trend of daily new confirmed cases of COVID-19 in the United States.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has several limitations. First, information on geolocation, demographics, and COVID-19 disease status was not available for all social media users in the study, owing to various legal limitations (such as the General Data Protection Regulation of the European Union). This might have introduced a sampling bias if there were significant differences between social media users’ characteristics in our project and the real world. However, by collaborating with social media analytics companies, we have maximized our ability to access thousands of social media data sources worldwide, thus minimizing the possibility of sampling bias. Additionally, the majority of social media users in our study were from the United States. The findings, therefore, may not be generalizable in their application to users located in other countries. Further, we did not conduct formal statistical analyses beyond comparing differences in trends between the frequency of health-related posts and new COVID-19 cases; hence, further testing is needed to confirm the associations between patterns of changes in symptom/medical condition posts and the fluctuations of COVID-19 statistics over time. Finally, we did not perform sentiment analysis or qualitative analysis in the study and did not verify whether authors who discussed COVID-19–related topics had COVID-19 themselves. We hope to accomplish and report this analysis in a future study. We also hope that other studies on social media’s role in public health will replicate and validate our exploratory findings in non-Twitter social media platforms.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this study, we classified web-based posts collected from June 14 to December 13, 2020, in accordance with discussions of symptoms and medical conditions. Neuropsychological symptoms such as anxiety were the most frequently mentioned symptom subcategory. Furthermore, COVID-19 infection was the most commonly mentioned medical condition. Our analysis also showed that the frequency of posts on anxiety and other general health symptoms, including generalized pain, weight loss, and fatigue, was significantly correlated with daily COVID-19 statistics in the United States. Additionally, health-related discussions were greater from September 1 to December 13, 2020, than from June 14 to August 31, 2020, aligning with the increase in COVID-19 cases in the United States during the winter months. These preliminary findings show promise for real-time monitoring of social media posts to measure the mental health status of a population during a global public health crisis and to assess the public’s main health needs that have not been captured or met by the existing health system. Future research may incorporate information from social media into predictive models for the detection of emerging infectious diseases.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary methods, figures, and tables.</p>
        <media xlink:href="publichealth_v7i9e29413_app1.docx" xlink:title="DOCX File , 2088 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CDC</term>
          <def>
            <p>Centers for Disease Control and Prevention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CNS</term>
          <def>
            <p>central nervous system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EVALI</term>
          <def>
            <p>e-cigarette, or vaping, product use-associated lung injury</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank the Center for Outcomes Research and Evaluation, Yale New Haven Hospital, for its coordination of the project. AC and Pini Matzner from Signals Analytics had full access to the data in the study and take responsibility for the integrity of the data and the accuracy of the data analysis. Signals, the analytics company, was acquired and is now part of Skai. QD takes full responsibility for the data interpretation and writing. All authors contributed to editing and approving the final version of the paper for publication. This work was supported by the project Insights about the COVID Pandemic Using Public Data IRES PD: 20-005872 with funding from the Foundation for a Smoke-Free World.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>YL is supported by the National Heart, Lung, and Blood Institute (K12HL138037) and the Yale Center for Implementation Science. RD is supported by an American Heart Association Transformational Project Award (#19TPA34830013) and a Canadian Institutes of Health Research Project Grant (RN356054–401229). In the past 3 years, HMK received expenses and personal fees from UnitedHealth, IBM Watson Health, Element Science, Aetna, Facebook, the Siegfried and Jensen Law Firm, Arnold and Porter Law Firm, Martin/Baughman Law Firm, F-Prime, and the National Center for Cardiovascular Diseases in Beijing. He is an owner of Refactor Health and HugoHealth, and had grants and contracts from the Centers for Medicare &#38; Medicaid Services, Medtronic, the US Food and Drug Administration, Johnson &#38; Johnson, and the Shenzhen Center for Health Information. The remaining authors have no disclosures to report.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An interactive web-based dashboard to track COVID-19 in real time</article-title>
          <source>Lancet Infect Dis</source>
          <year>2020</year>
          <month>05</month>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>533</fpage>
          <lpage>534</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32087114"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="medline">32087114</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Lurie</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Social Media and Emergency Preparedness in Response to Novel Coronavirus</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>05</month>
          <day>26</day>
          <volume>323</volume>
          <issue>20</issue>
          <fpage>2011</fpage>
          <lpage>2012</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.4469</pub-id>
          <pub-id pub-id-type="medline">32202611</pub-id>
          <pub-id pub-id-type="pii">2763596</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clement</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Share of social media users in the United States who believe they will use select social media more if confined at home due to the coronavirus as of March 2020</article-title>
          <source>Statista</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.statista.com/statistics/1106343/social-usage-increase-due-to-coronavirus-home-usa/">https://www.statista.com/statistics/1106343/social-usage-increase-due-to-coronavirus-home-usa/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yousuf</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Corbin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sweep</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hofstra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Scherder</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>van Gorp</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zwetsloot</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Rossum</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lindemans</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Narula</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hofstra</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Association of a Public Health Campaign About Coronavirus Disease 2019 Promoted by News Media and a Social Influencer With Self-reported Personal Hygiene and Physical Distancing in the Netherlands</article-title>
          <source>JAMA Netw Open</source>
          <year>2020</year>
          <month>07</month>
          <day>01</day>
          <volume>3</volume>
          <issue>7</issue>
          <fpage>e2014323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jamanetwork.com/journals/jamanetworkopen/fullarticle/10.1001/jamanetworkopen.2020.14323"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.14323</pub-id>
          <pub-id pub-id-type="medline">32639569</pub-id>
          <pub-id pub-id-type="pii">2767992</pub-id>
          <pub-id pub-id-type="pmcid">PMC7344381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-Alrazaq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alhuwail</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Househ</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hamdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Top Concerns of Tweeters During the COVID-19 Pandemic: Infoveillance Study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>21</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e19016</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e19016/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19016</pub-id>
          <pub-id pub-id-type="medline">32287039</pub-id>
          <pub-id pub-id-type="pii">v22i4e19016</pub-id>
          <pub-id pub-id-type="pmcid">PMC7175788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wahbeh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nasralah</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Ramahi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>El-Gayar</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Mining Physicians' Opinions on Social Media to Obtain Insights Into COVID-19: Mixed Methods Analysis</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>06</month>
          <day>18</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e19276</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/2/e19276/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19276</pub-id>
          <pub-id pub-id-type="medline">32421686</pub-id>
          <pub-id pub-id-type="pii">v6i2e19276</pub-id>
          <pub-id pub-id-type="pmcid">PMC7304257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Calvo</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Deterding</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Health surveillance during covid-19 pandemic</article-title>
          <source>BMJ</source>
          <year>2020</year>
          <month>04</month>
          <day>06</day>
          <volume>369</volume>
          <fpage>m1373</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.m1373</pub-id>
          <pub-id pub-id-type="medline">32253180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>HO</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huynh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>YouTube as a source of information on COVID-19: a pandemic of misinformation?</article-title>
          <source>BMJ Glob Health</source>
          <year>2020</year>
          <month>05</month>
          <volume>5</volume>
          <issue>5</issue>
          <fpage>e002604</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gh.bmj.com/lookup/pmidlookup?view=long&#38;pmid=32409327"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjgh-2020-002604</pub-id>
          <pub-id pub-id-type="medline">32409327</pub-id>
          <pub-id pub-id-type="pii">bmjgh-2020-002604</pub-id>
          <pub-id pub-id-type="pmcid">PMC7228483</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Padrez</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the predictability of medical conditions from social media posts</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>e0215476</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0215476"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0215476</pub-id>
          <pub-id pub-id-type="medline">31206534</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-34864</pub-id>
          <pub-id pub-id-type="pmcid">PMC6576767</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Sherman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stokes</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Seltzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>Tracking Mental Health and Symptom Mentions on Twitter During COVID-19</article-title>
          <source>J Gen Intern Med</source>
          <year>2020</year>
          <month>09</month>
          <volume>35</volume>
          <issue>9</issue>
          <fpage>2798</fpage>
          <lpage>2800</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32638321"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-020-05988-8</pub-id>
          <pub-id pub-id-type="medline">32638321</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-020-05988-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7340749</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolliakou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bakolis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chandran</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Derczynski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Werbeloff</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Osborn</surname>
              <given-names>DPJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bontcheva</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Mental health-related conversations on social media and crisis episodes: a time-series regression analysis</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>02</month>
          <day>06</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>1342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-57835-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-57835-9</pub-id>
          <pub-id pub-id-type="medline">32029754</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-57835-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7005283</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fishman</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Casarett</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Mass media and medicine: when the most trusted media mislead</article-title>
          <source>Mayo Clin Proc</source>
          <year>2006</year>
          <month>03</month>
          <volume>81</volume>
          <issue>3</issue>
          <fpage>291</fpage>
          <lpage>293</lpage>
          <pub-id pub-id-type="doi">10.4065/81.3.291</pub-id>
          <pub-id pub-id-type="medline">16529129</pub-id>
          <pub-id pub-id-type="pii">S0025-6196(11)61454-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Czeisler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marynak</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Salah</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shakya</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Thierry</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>McMillan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wiley</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Czeisler</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Rajaratnam</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Delay or Avoidance of Medical Care Because of COVID-19-Related Concerns - United States, June 2020</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2020</year>
          <month>09</month>
          <day>11</day>
          <volume>69</volume>
          <issue>36</issue>
          <fpage>1250</fpage>
          <lpage>1257</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15585/mmwr.mm6936a4"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.mm6936a4</pub-id>
          <pub-id pub-id-type="medline">32915166</pub-id>
          <pub-id pub-id-type="pmcid">PMC7499838</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hui</surname>
              <given-names>DSC</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yuen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>N</given-names>
            </name>
            <collab>China Medical Treatment Expert Group for Covid-19</collab>
          </person-group>
          <article-title>Clinical Characteristics of Coronavirus Disease 2019 in China</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>04</month>
          <day>30</day>
          <volume>382</volume>
          <issue>18</issue>
          <fpage>1708</fpage>
          <lpage>1720</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32109013"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa2002032</pub-id>
          <pub-id pub-id-type="medline">32109013</pub-id>
          <pub-id pub-id-type="pmcid">PMC7092819</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>SWX</given-names>
            </name>
            <name name-style="western">
              <surname>Kalimuddin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Low</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Loh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Marimuthu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ang</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>Mak</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TY</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>TY</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Said</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kurupatham</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vasoo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>RTP</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>VJM</given-names>
            </name>
            <name name-style="western">
              <surname>Leo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lye</surname>
              <given-names>DC</given-names>
            </name>
            <collab>Singapore 2019 Novel Coronavirus Outbreak Research Team</collab>
          </person-group>
          <article-title>Epidemiologic Features and Clinical Course of Patients Infected With SARS-CoV-2 in Singapore</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>04</month>
          <day>21</day>
          <volume>323</volume>
          <issue>15</issue>
          <fpage>1488</fpage>
          <lpage>1494</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32125362"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2020.3204</pub-id>
          <pub-id pub-id-type="medline">32125362</pub-id>
          <pub-id pub-id-type="pii">2762688</pub-id>
          <pub-id pub-id-type="pmcid">PMC7054855</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rempel</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Carenini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Janjua</surname>
              <given-names>NZ</given-names>
            </name>
          </person-group>
          <article-title>Tracking COVID-19 Discourse on Twitter in North America: Infodemiology Study Using Topic Modeling and Aspect-Based Sentiment Analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>02</month>
          <day>10</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>e25431</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/2/e25431/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25431</pub-id>
          <pub-id pub-id-type="medline">33497352</pub-id>
          <pub-id pub-id-type="pii">v23i2e25431</pub-id>
          <pub-id pub-id-type="pmcid">PMC7879725</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boon-Itt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Skunkan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Public Perception of the COVID-19 Pandemic on Twitter: Sentiment Analysis and Topic Modeling Study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>11</month>
          <day>11</day>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e21978</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/4/e21978/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21978</pub-id>
          <pub-id pub-id-type="medline">33108310</pub-id>
          <pub-id pub-id-type="pii">v6i4e21978</pub-id>
          <pub-id pub-id-type="pmcid">PMC7661106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Valdez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ten Thij</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bathina</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rutter</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bollen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Social Media Insights Into US Mental Health During the COVID-19 Pandemic: Longitudinal Analysis of Twitter Data</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>12</month>
          <day>14</day>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>e21418</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/12/e21418/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21418</pub-id>
          <pub-id pub-id-type="medline">33284783</pub-id>
          <pub-id pub-id-type="pii">v22i12e21418</pub-id>
          <pub-id pub-id-type="pmcid">PMC7744146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spurlock</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Elgazzar</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Predicting COVID-19 Infection Groups using Social Networks and Machine Learning Algorithms</article-title>
          <year>2020</year>
          <conf-name>11th IEEE Annual Ubiquitous Computing, Electronics &#38; Mobile Communication Conference (UEMCON)</conf-name>
          <conf-date>October 28-31, 2020</conf-date>
          <conf-loc>New York, NY</conf-loc>
          <pub-id pub-id-type="doi">10.1109/uemcon51285.2020.9298093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>HTN</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Texas Public Agencies' Tweets and Public Engagement During the COVID-19 Pandemic: Natural Language Processing Approach</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>04</month>
          <day>26</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>e26720</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/4/e26720/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26720</pub-id>
          <pub-id pub-id-type="medline">33847587</pub-id>
          <pub-id pub-id-type="pii">v7i4e26720</pub-id>
          <pub-id pub-id-type="pmcid">PMC8078375</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the Potential Role of Social Media in Preventive Health Care</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>02</month>
          <day>04</day>
          <volume>323</volume>
          <issue>5</issue>
          <fpage>411</fpage>
          <lpage>412</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2019.21084</pub-id>
          <pub-id pub-id-type="medline">31922532</pub-id>
          <pub-id pub-id-type="pii">2758937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Cuomo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Purushothaman</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Data Mining and Content Analysis of the Chinese Social Media Platform Weibo During the Early COVID-19 Outbreak: Retrospective Observational Infoveillance Study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>04</month>
          <day>21</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e18700</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/2/e18700/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18700</pub-id>
          <pub-id pub-id-type="medline">32293582</pub-id>
          <pub-id pub-id-type="pii">v6i2e18700</pub-id>
          <pub-id pub-id-type="pmcid">PMC7175787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Monroy-Hernández</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harry</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>André</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Panovich</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vargas</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>4chan and /b/: An Analysis of Anonymity and Ephemerality in a Large Online Community</article-title>
          <year>2011</year>
          <conf-name>Fifth International AAAI Conference on Weblogs and Social Media</conf-name>
          <conf-date>July 17-21, 2011</conf-date>
          <conf-loc>Barcelona</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojs.aaai.org/index.php/ICWSM/article/view/14134"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weichselbraun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brasoveanu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Waldvogel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Odoni</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Harvest - An Open Source Toolkit for Extracting Posts and Post Metadata from Web Forums</article-title>
          <year>2020</year>
          <conf-name>IEEE/WIC/ACM International Joint Conference on Web Intelligence and Intelligent Agent Technology (WI-IAT)</conf-name>
          <conf-date>December 14-17, 2020</conf-date>
          <conf-loc>Melbourne, VIC</conf-loc>
          <pub-id pub-id-type="doi">10.1109/wiiat50758.2020.00065</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prakasam</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Huxtable-Thomas</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Reddit: Affordances as an Enabler for Shifting Loyalties</article-title>
          <source>Inf Syst Front</source>
          <year>2020</year>
          <month>03</month>
          <day>26</day>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>723</fpage>
          <lpage>751</lpage>
          <pub-id pub-id-type="doi">10.1007/s10796-020-10002-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Babvey</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Capela</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cappa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lipizzi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Petrowski</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez-Marquez</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using social media data for assessing children's exposure to violence during the COVID-19 pandemic</article-title>
          <source>Child Abuse Negl</source>
          <year>2021</year>
          <month>06</month>
          <volume>116</volume>
          <issue>Pt 2</issue>
          <fpage>104747</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0145-2134(20)30402-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chiabu.2020.104747</pub-id>
          <pub-id pub-id-type="medline">33358281</pub-id>
          <pub-id pub-id-type="pii">S0145-2134(20)30402-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7498240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perrin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Share of U.S. adults using social media, including Facebook, is mostly unchanged since 2018</article-title>
          <source>Pew Research Center</source>
          <year>2019</year>
          <month>04</month>
          <day>10</day>
          <access-date>2021-06-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pewrsr.ch/2VxJuJ3">https://pewrsr.ch/2VxJuJ3</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Matni</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>What social media data should I use in my research?: A comparative analysis of Twitter, YouTube, Reddit, and the New York Times comments</article-title>
          <source>Proc Assoc Info Sci Tech</source>
          <year>2016</year>
          <month>12</month>
          <day>27</day>
          <volume>53</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/pra2.2016.14505301151"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pra2.2016.14505301151</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>Meet Skai: smarter, faster go-to-market</article-title>
          <source>Skai</source>
          <access-date>2020-12-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.signals-analytics.com">https://www.signals-analytics.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <article-title>How can we help drive your business?</article-title>
          <source>NetBase Quid</source>
          <access-date>2020-12-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://netbasequid.com">https://netbasequid.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Axisbits</collab>
          </person-group>
          <article-title>COVID-19 Statistics</article-title>
          <source>Rapid API</source>
          <access-date>2021-01-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://rapidapi.com/axisbits-axisbits-default/api/covid-19-statistics/details">https://rapidapi.com/axisbits-axisbits-default/api/covid-19-statistics/details</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oren</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Moed</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Matzner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Caraballo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Krumholz</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Engagement With COVID-19 Public Health Measures in the United States: A Cross-sectional Social Media Analysis from June to November 2020</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>06</month>
          <day>21</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e26655</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e26655/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26655</pub-id>
          <pub-id pub-id-type="medline">34086593</pub-id>
          <pub-id pub-id-type="pii">v23i6e26655</pub-id>
          <pub-id pub-id-type="pmcid">PMC8218897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matzner</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Using advanced analytics for the early detection of pandemics and outbreaks</article-title>
          <source>Signals Analytics</source>
          <access-date>2021-01-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://info.signals-analytics.com/research-paper-early-detection-pandemics">https://info.signals-analytics.com/research-paper-early-detection-pandemics</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>Symptoms of COVID-19</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2020-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html">https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>How to deal with the negative psychological impact of COVID-19 for people who pay attention to anxiety and depression</article-title>
          <source>Precis Clin Med</source>
          <year>2020</year>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>161</fpage>
          <lpage>168</lpage>
          <pub-id pub-id-type="doi">10.1093/pcmedi/pbaa023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A nationwide survey of psychological distress among Chinese people in the COVID-19 epidemic: implications and policy recommendations</article-title>
          <source>Gen Psychiatr</source>
          <year>2020</year>
          <volume>33</volume>
          <issue>2</issue>
          <fpage>e100213</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32215365"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/gpsych-2020-100213</pub-id>
          <pub-id pub-id-type="medline">32215365</pub-id>
          <pub-id pub-id-type="pii">gpsych-2020-100213</pub-id>
          <pub-id pub-id-type="pmcid">PMC7061893</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Harnessing social media for health information management</article-title>
          <source>Electron Commer Res Appl</source>
          <year>2018</year>
          <volume>27</volume>
          <fpage>139</fpage>
          <lpage>151</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30147636"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.elerap.2017.12.003</pub-id>
          <pub-id pub-id-type="medline">30147636</pub-id>
          <pub-id pub-id-type="pmcid">PMC6105292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Picone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Inoue</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>DeFelice</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Naujokas</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Sinrod</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Stapleton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sinrod</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Diebel</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Wassman</surname>
              <given-names>ER</given-names>
            </name>
          </person-group>
          <article-title>Social Listening as a Rapid Approach to Collecting and Analyzing COVID-19 Symptoms and Disease Natural Histories Reported by Large Numbers of Individuals</article-title>
          <source>Popul Health Manag</source>
          <year>2020</year>
          <month>10</month>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>350</fpage>
          <lpage>360</lpage>
          <pub-id pub-id-type="doi">10.1089/pop.2020.0189</pub-id>
          <pub-id pub-id-type="medline">32897820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lakamana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hogg-Bremer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Garadi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Self-reported COVID-19 symptoms on Twitter: an analysis and a research resource</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>08</month>
          <day>01</day>
          <volume>27</volume>
          <issue>8</issue>
          <fpage>1310</fpage>
          <lpage>1315</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32620975"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa116</pub-id>
          <pub-id pub-id-type="medline">32620975</pub-id>
          <pub-id pub-id-type="pii">5867237</pub-id>
          <pub-id pub-id-type="pmcid">PMC7337747</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Killerby</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Newton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ashworth</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Berns</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bressler</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Bye</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Crawford</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harduar Morano</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Markus</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Read</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Rissman</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tate</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Midgley</surname>
              <given-names>CM</given-names>
            </name>
            <collab>Case Investigation Form Working Group</collab>
          </person-group>
          <article-title>Symptom Profiles of a Convenience Sample of Patients with COVID-19 - United States, January-April 2020</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2020</year>
          <month>07</month>
          <day>17</day>
          <volume>69</volume>
          <issue>28</issue>
          <fpage>904</fpage>
          <lpage>908</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15585/mmwr.mm6928a2"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.mm6928a2</pub-id>
          <pub-id pub-id-type="medline">32673296</pub-id>
          <pub-id pub-id-type="pmcid">PMC7366851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alimohamadi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sepandi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Taghdir</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hosamirudsari</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Determine the most common clinical symptoms in COVID-19 patients: a systematic review and meta-analysis</article-title>
          <source>J Prev Med Hyg</source>
          <year>2020</year>
          <month>09</month>
          <volume>61</volume>
          <issue>3</issue>
          <fpage>E304</fpage>
          <lpage>E312</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15167/2421-4248/jpmh2020.61.3.1530"/>
          </comment>
          <pub-id pub-id-type="doi">10.15167/2421-4248/jpmh2020.61.3.1530</pub-id>
          <pub-id pub-id-type="medline">33150219</pub-id>
          <pub-id pub-id-type="pmcid">PMC7595075</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Lurie</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Social Media and Emergency Preparedness in Response to Novel Coronavirus</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>05</month>
          <day>26</day>
          <volume>323</volume>
          <issue>20</issue>
          <fpage>2011</fpage>
          <lpage>2012</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.4469</pub-id>
          <pub-id pub-id-type="medline">32202611</pub-id>
          <pub-id pub-id-type="pii">2763596</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aretakis</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hauck</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Delta live updates: Hundreds of thousands without power across south; Louisiana governor urges caution as clean-up begins</article-title>
          <source>USA Today</source>
          <access-date>2020-12-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.usatoday.com/story/news/nation/2020/10/10/hurricane-delta-update-damage-weakens-tropical-storm-power-outages/5952093002/">https://www.usatoday.com/story/news/nation/2020/10/10/hurricane-delta-update-damage-weakens-tropical-storm-power-outages/5952093002/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
