<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i12e32814</article-id>
      <article-id pub-id-type="pmid">34665761</article-id>
      <article-id pub-id-type="doi">10.2196/32814</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Factors Driving the Popularity and Virality of COVID-19 Vaccine Discourse on Twitter: Text Mining and Data Visualization Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Xie</surname>
            <given-names>Wenjing</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Turner</surname>
            <given-names>Jason</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Jueman</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2653-5914</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Yi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2293-3664</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Shi</surname>
            <given-names>Molu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8586-4999</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Xiuli</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>School of New Media</institution>
            <institution>Peking University</institution>
            <addr-line>5 Yiheyuan Road</addr-line>
            <addr-line>Haidian District</addr-line>
            <addr-line>Beijing, 100871</addr-line>
            <country>China</country>
            <phone>86 10 6276 6689</phone>
            <email>xiuli.wang@pku.edu.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6954-7475</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Polk School of Communications</institution>
        <institution>Long Island University</institution>
        <addr-line>Brooklyn, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Communication</institution>
        <institution>University of Louisville</institution>
        <addr-line>Louisville, KY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <addr-line>Louisville, KY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of New Media</institution>
        <institution>Peking University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xiuli Wang <email>xiuli.wang@pku.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>12</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>12</month>
        <year>2021</year>
      </pub-date>
      <volume>7</volume>
      <issue>12</issue>
      <elocation-id>e32814</elocation-id>
      <history>
        <date date-type="received">
          <day>10</day>
          <month>8</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>9</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>10</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>10</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Jueman Zhang, Yi Wang, Molu Shi, Xiuli Wang. Originally published in JMIR Public Health and Surveillance (https://publichealth.jmir.org), 03.12.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on https://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://publichealth.jmir.org/2021/12/e32814" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>COVID-19 vaccination is considered a critical prevention measure to help end the pandemic. Social media platforms such as Twitter have played an important role in the public discussion about COVID-19 vaccines.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to investigate message-level drivers of the popularity and virality of tweets about COVID-19 vaccines using machine-based text-mining techniques. We further aimed to examine the topic communities of the most liked and most retweeted tweets using network analysis and visualization.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We collected US-based English-language public tweets about COVID-19 vaccines from January 1, 2020, to April 30, 2021 (N=501,531). Topic modeling and sentiment analysis were used to identify latent topics and valence, which together with autoextracted information about media presence, linguistic features, and account verification were used in regression models to predict likes and retweets. Among the 2500 most liked tweets and 2500 most retweeted tweets, network analysis and visualization were used to detect topic communities and present the relationship between the topics and the tweets.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Topic modeling yielded 12 topics. The regression analyses showed that 8 topics positively predicted likes and 7 topics positively predicted retweets, among which the topic of vaccine development and people’s views and that of vaccine efficacy and rollout had relatively larger effects. Network analysis and visualization revealed that the 2500 most liked and most retweeted tweets clustered around the topics of vaccine access, vaccine efficacy and rollout, vaccine development and people’s views, and vaccination status. The overall valence of the tweets was positive. Positive valence increased likes, but valence did not affect retweets. Media (photo, video, gif) presence and account verification increased likes and retweets. Linguistic features had mixed effects on likes and retweets.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study suggests the public interest in and demand for information about vaccine development and people’s views, and about vaccine efficacy and rollout. These topics, along with the use of media and verified accounts, have enhanced the popularity and virality of tweets. These topics could be addressed in vaccine campaigns to help the diffusion of content on Twitter.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>COVID-19</kwd>
        <kwd>vaccine</kwd>
        <kwd>topic modeling</kwd>
        <kwd>LDA</kwd>
        <kwd>valence</kwd>
        <kwd>share</kwd>
        <kwd>viral</kwd>
        <kwd>Twitter</kwd>
        <kwd>social media</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Since the World Health Organization (WHO) declared the COVID-19 outbreak a pandemic in March 2020 [<xref ref-type="bibr" rid="ref1">1</xref>], the United States has seen the highest number of confirmed cases and deaths [<xref ref-type="bibr" rid="ref2">2</xref>]. Many health organizations, including the WHO [<xref ref-type="bibr" rid="ref3">3</xref>] and the US Centers for Disease Control and Prevention (CDC) [<xref ref-type="bibr" rid="ref4">4</xref>], consider vaccination as a critical prevention measure to help end the pandemic and restore society to its normal status. Owing to remarkable advances in vaccinology, scientists developed COVID-19 vaccines within an unprecedentedly short time. In December 2020, less than 1 year after the virus was identified, the first two vaccines were approved for emergency use in the United States: the Pfizer-BioNTech vaccine and the Moderna vaccine [<xref ref-type="bibr" rid="ref5">5</xref>]. Both of these vaccines use messenger RNA (mRNA)-based technology, which had not been approved previously for general use in humans [<xref ref-type="bibr" rid="ref5">5</xref>]. Johnson &#38; Johnson’s Janssen vaccine, which is based on a slightly more mature technology of a viral vector, became the third vaccine approved for emergency use in the United States in February 2021 [<xref ref-type="bibr" rid="ref6">6</xref>]. Owing to their novelty, COVID-19 vaccines had potential to fuel the existing vaccine debate, including arguments over vaccine safety and effectiveness, which had received notable attention in recent years before the pandemic [<xref ref-type="bibr" rid="ref7">7</xref>]. In addition, political polarization, reaffirmed in the 2020 presidential election, was manifested in a wide range of issues, including responses to the COVID-19 pandemic [<xref ref-type="bibr" rid="ref8">8</xref>] and vaccines [<xref ref-type="bibr" rid="ref9">9</xref>]. 
Generally, Democrats had more favorable attitudes toward COVID-19 vaccines than Republicans [<xref ref-type="bibr" rid="ref9">9</xref>]. These political fissures further had potential to propel the vaccine debate. Amidst the heated discussion of COVID-19 vaccines, the United States has been rolling out the most massive vaccination campaign in its history to fight against the pandemic [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
        <p>Investigating public discourse about COVID-19 vaccines will shed light on people’s perception and attitudes. As a major social media platform and a vital source for text-based public discourse, Twitter has been studied to understand public discourse about vaccines in general [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>] and about specific vaccines, including COVID-19 vaccines [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Text-mining techniques have been increasingly used in recent research to investigate tweets about the COVID-19 pandemic (eg, [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]) and about COVID-19 vaccines [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. These studies have employed machine learning algorithms to automatically analyze massive amounts of tweets and capture latent textual information such as topics, sentiment, and trends.</p>
        <p>Although text mining is clearly an effective way to identify underlying textual clusters and patterns from vast amounts of tweets, less is known about how such information can help to understand the diffusion of information and opinions on Twitter. The aim of this study was to investigate message-level drivers of the popularity and virality of tweets about COVID-19 vaccines using text-mining techniques. Specifically, the objective of the study was to investigate how text-mined topics and valence, together with social media message features, affect likes and retweets. Another aim of the study was to examine the topic communities of the most liked and most retweeted tweets using network analysis and visualization. These findings have implications for the direction of vaccine campaigns.</p>
      </sec>
      <sec>
        <title>Literature Review</title>
        <p>The extent to which a message results in optimal diffusion on social media can be assessed by users’ favorable responses such as clicking “like” and “share” buttons to overtly indicate individual interest and support [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. On Twitter, users can click on the “Like” icon to show appreciation for a tweet or on the “Retweet” icon to share it publicly with their followers [<xref ref-type="bibr" rid="ref24">24</xref>]. Prior research has considered the like count of a tweet as an indicator of its popularity and the retweet count of a tweet as an indicator of its virality [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Drawing on these studies [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>], we assessed the popularity of a tweet by the number of likes and assessed the virality of a tweet by the number of retweets. Compared with liking, retweeting is a more social behavior [<xref ref-type="bibr" rid="ref26">26</xref>]. For both responses, the bandwagon effect postulates that the adoption of trends increases more with respect to the number of people who have already done so [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>This study investigated three categories of message-level factors that, according to prior research, can drive the diffusion of media content online: information, emotion, and social media message features. As Twitter is a major source of text-based information, we drew on the literature related to the social transmission of online text information, including news articles and tweets. Past research on the virality of online news has suggested two categories of determinants: informational and emotional. From the informational perspective, information utility, as gauged by overall content usefulness, was found to prompt social media sharing of general news articles [<xref ref-type="bibr" rid="ref27">27</xref>]. In the health context, a content attribute that taps into information utility is the presence of efficacy information [<xref ref-type="bibr" rid="ref26">26</xref>], which provides ways to promote health or overcome a health risk [<xref ref-type="bibr" rid="ref28">28</xref>]. Research has shown that overall content usefulness and presence of efficacy information both facilitate viewing and sharing of health news articles on social media [<xref ref-type="bibr" rid="ref26">26</xref>]. In the situation of the COVID-19 pandemic, gaps in knowledge about the new coronavirus were evident in the United States early on [<xref ref-type="bibr" rid="ref29">29</xref>] and demand for information of practical value was expected [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. In addition, according to the uncertainty reduction theory, to alleviate risks in crises, people intend to engage in uncertainty reduction efforts by collecting credible information and sharing with others [<xref ref-type="bibr" rid="ref25">25</xref>]. 
Nanath and Joy’s [<xref ref-type="bibr" rid="ref25">25</xref>] text mining study revealed that the optimism and solution topic as well as the mental health topic were positive predictors of retweet counts of COVID-19–related tweets. In addition to information utility, novel content in health news has been found to increase sharing [<xref ref-type="bibr" rid="ref26">26</xref>]. COVID-19 vaccines were newly developed to help fight off the new coronavirus; thus, content related to aspects such as development and efficacy had the intrinsic feature of novelty and could potentially help to close the knowledge gaps.</p>
        <p>Past research has generally shown that there were more positive than negative tweets on Twitter about vaccines in general [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>] and about COVID-19 vaccines in particular [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Although positive content has been found to increase likes on social media [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], the findings are mixed regarding the impact of valence on the virality of online content. Berger and Milkman [<xref ref-type="bibr" rid="ref27">27</xref>] found that positive sentiment increased social media sharing of general news. A plausible explanation is that positive sharing reflects the positivity of the sender [<xref ref-type="bibr" rid="ref26">26</xref>], which may enhance self-presentation [<xref ref-type="bibr" rid="ref31">31</xref>] and identity communication [<xref ref-type="bibr" rid="ref27">27</xref>]. However, Nanath and Joy [<xref ref-type="bibr" rid="ref25">25</xref>] found that negative emotions increased the social transmission of COVID-19–related tweets. Moreover, Blankenship et al [<xref ref-type="bibr" rid="ref11">11</xref>] revealed that antivaccine tweets were retweeted more than provaccine tweets. In comparison, Kim [<xref ref-type="bibr" rid="ref26">26</xref>] revealed that content valence was unrelated to the virality of health news on social media.</p>
        <p>In addition to content topic and valence, social media message features, including media presence, linguistic features, and account verification, could impact the popularity and virality of online content. Media presence and linguistic features can affect content processing fluency and further affect favorable online responses such as liking and retweeting. Content on social media may be of any mode such as text, photos, and videos. Past research has shown that a tweet with embedded media (ie, a photo or a video) stimulates likes and retweets [<xref ref-type="bibr" rid="ref23">23</xref>]. It is postulated that the cognitive processing of photos is more fluent than that of words as it is faster to activate the semantic meaning of photos than that of words [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. Therefore, tweets featuring embedded media are more likely to trigger favorable online responses.</p>
        <p>In comparison, past research has revealed that linguistic features such as the number of hashtags, mentions, and external links decrease likes [<xref ref-type="bibr" rid="ref23">23</xref>] and retweets [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. It is suggested that these features increase content processing disfluency in two aspects. First, compared to the black color adopted by text, the blue color adopted by hashtags, mentions, and external links decreases the font-background contrast and causes visual perceptual disfluency [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Second, the nonalphanumeric symbols used by hashtags, mentions, and external links (ie, #, @, ://) create orthographical disfluency [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The content disfluency requires more cognitive effort to process the message and hence decreases favorable responses [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>Finally, account features could potentially affect likes and retweets. In the face of information explosion in the digital age, account authenticity could be of particular importance in the diffusion of information. On Twitter, verified accounts have a blue badge next to the profile name to let users know that it is authentic. Twitter paused public submissions for account verification in 2017 and reopened the gate using a new application process in May 2021 [<xref ref-type="bibr" rid="ref36">36</xref>]. The end date of our data retrieval was April 30, 2021, and therefore the data did not reflect the newly verified accounts. In addition, it is noteworthy that the tweets posted by verified accounts may not be verified.</p>
      </sec>
      <sec>
        <title>Research Model and Questions</title>
        <p>This study contributes to the literature by providing a conceptual model to understand the combined effects of the three above-mentioned categories of factors—content topics, content valence, and social media message features, including media presence, linguistic features, and account verification—on the popularity and virality of tweets about COVID-19 vaccines. We employed topic modeling to identify latent topics of tweets. We employed sentiment analysis to assess the valence of tweets. Automated extraction generated data about social media features. Therefore, we put forward the following research questions:</p>
        <disp-quote>
          <p>Research question 1 (RQ1): How do content topics, content valence, and social media message features affect the popularity of tweets about COVID-19 vaccines?</p>
        </disp-quote>
        <disp-quote>
          <p>Research question 2 (RQ2): How do content topics, content valence, and social media message features affect the virality of tweets about COVID-19 vaccines?</p>
        </disp-quote>
        <p>In addition, among the 2500 most liked and most retweeted tweets, respectively, we used network analysis and visualization to detect topic communities and present the relationship between the topics and the tweets. We had the following research questions:</p>
        <disp-quote>
          <p>Research question 3 (RQ3): What are the salient topics of the most liked tweets?</p>
        </disp-quote>
        <disp-quote>
          <p>Research question 4 (RQ4): What are the salient topics of the most retweeted tweets?</p>
        </disp-quote>
        <p>This study can help to advance knowledge on complex drivers of the popularity and virality of tweets about COVID-19 vaccines using machine-based text mining and network visualization in the context of a heated vaccine debate in the United States. These findings offer practical implications for health practitioners to employ more effective social media content.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Source</title>
        <p>We collected publicly available original tweets about COVID-19 vaccines from January 1, 2020, to April 30, 2021, using snscrape [<xref ref-type="bibr" rid="ref37">37</xref>], which were further filtered according to user profile data to include only English-language tweets and those from US-based users. This approach resulted in 501,531 tweets recorded in the final dataset.</p>
        <p>Drawing on prior social media studies on vaccines [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>], we developed keywords by balancing the general COVID-19 vaccine information with brand-specific information. As of April 30, 2021, which was our data retrieval end date, Pfizer-BioNTech, Moderna, and Johnson &#38; Johnson/Janssen vaccines were authorized for emergency use in the United States [<xref ref-type="bibr" rid="ref40">40</xref>]. At that time, the three vaccines, together with the AstraZeneca vaccine, had conditional marketing authorizations in European Union countries [<xref ref-type="bibr" rid="ref41">41</xref>]. Although the AstraZeneca vaccine was not used in the United States, it garnered media and public attention in the United States, and therefore we also included this brand in the search. In addition, as COVID-19 vaccines varied in terms of the underlying technology, we considered technology-specific information. Pfizer-BioNTech and Moderna used mRNA technology, and Johnson &#38; Johnson and AstraZeneca-Oxford used viral vector technology. Moreover, we checked government Twitter accounts such as the US CDC and Food and Drug Administration accounts to explore hashtags. Finally, the following strategy was used to scrape Twitter data. A tweet had to contain the keyword (case-insensitive unless otherwise specified) “vaccine,” together with one of the keywords “COVID,” “COVID19,” “COVID-19,” “Pfizer,” “Pfizer-BioNTech,” “Moderna,” “Johnson &#38; Johnson,” “Janssen,” “AstraZeneca,” and “Oxford-AstraZeneca”; or contain the keyword “vaccine” together with one of the following combinations: “mRNA” and “COVID,” “viral vector” and “COVID,” and “adenovirus” and “COVID”; or contain either of the two hashtags “#covid19vaccine” and “#covidvaccine.”</p>
      </sec>
      <sec>
        <title>Data Processing</title>
        <p>The final dataset was preprocessed via gensim [<xref ref-type="bibr" rid="ref42">42</xref>] for topic modeling and sentiment analysis. We tokenized each tweet as a list of words [<xref ref-type="bibr" rid="ref43">43</xref>], and removed high-frequency stop words such as “https” and “covid,” in addition to the standard nltk stop words library [<xref ref-type="bibr" rid="ref44">44</xref>], which were not expected to contribute to the uniqueness of each topic. The text corpus was then trained to recognize frequent bigrams such as “New York,” using a gensim bigram model [<xref ref-type="bibr" rid="ref42">42</xref>]. Next, all words were lemmatized to their dictionary form [<xref ref-type="bibr" rid="ref43">43</xref>] to reduce redundancy in the bag of words (BOW) encoding. Finally, these lemmatized single words (ie, unigrams) and bigrams recognized by the bigram model were used to build the BOW representation for our latent Dirichlet allocation (LDA) model. That is, the corpus was encoded as a vector space, with each vector component representing a lemma.</p>
      </sec>
      <sec>
        <title>Measures</title>
        <sec>
          <title>Like Count</title>
          <p>The like count of each tweet, which is the number of likes a tweet gets, was captured in the data set. As a small number of tweets generated a great number of likes, the distribution was right-skewed. To reduce right skewness, we used the natural logarithm of like counts in statistical analyses, as in past research [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        </sec>
        <sec>
          <title>Retweet Count</title>
          <p>The retweet count of each tweet, which is the number of retweets a tweet gets, was captured in the data set. Similar to like counts, retweet counts had a right-skewed distribution. To reduce right skewness, we used the natural logarithm of retweet counts in statistical analyses, as in past research [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        </sec>
        <sec>
          <title>Content Topic</title>
          <p>The tweets were subjected to topic modeling using the LDA model [<xref ref-type="bibr" rid="ref45">45</xref>]. Topic modeling is a commonly used unsupervised learning method that generates a probabilistic model for the corpus of text data [<xref ref-type="bibr" rid="ref46">46</xref>]. As one of the two main topic models [<xref ref-type="bibr" rid="ref46">46</xref>], LDA is increasingly being used to analyze textual data [<xref ref-type="bibr" rid="ref47">47</xref>], including tweets (eg, [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]).</p>
          <p>LDA depends on two matrices to define the latent topical structure: the word-topic matrix and the document-topic matrix [<xref ref-type="bibr" rid="ref47">47</xref>]. In our study, a document was a tweet. The general idea is that a tweet is represented by a Dirichlet distribution of latent topics, where each latent topic is represented by a Dirichlet distribution of words [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
          <p>The word-topic matrix reveals the conditional probability with which a word is likely to occur in a topic. The word-topic matrix is used to interpret the topics. A topic can be interpreted by examining a list of the most probable words ranked solely by their frequency to occur in that topic, using 3 to 30 words [<xref ref-type="bibr" rid="ref48">48</xref>]. To aid topic interpretation, we also considered the ranking of the most probable topic-specific words by both frequency and relevance, as suggested by Sievert and Shirley [<xref ref-type="bibr" rid="ref48">48</xref>]. The relevance for ranking words within a topic is indexed by a weight parameter, λ, with a value ranging from 0 to 1. A value closer to 0 highlights rare but exclusive words for the topic and a value closer to 1 highlights frequent but not necessarily exclusive words for the topic [<xref ref-type="bibr" rid="ref48">48</xref>]. We adopted the recommended λ of 0.6 [<xref ref-type="bibr" rid="ref48">48</xref>]. Lastly, we reviewed sample tweets with the highest topic-specific loadings to finalize topic interpretations.</p>
          <p>The document-topic matrix reveals the conditional probability with which a topic is likely to occur in a tweet. In other words, it reveals the topic loadings for each tweet. The information was used in the regression models for prediction as well as in network analysis and visualization. The topic loading value ranges from 0 to 1, with a value closer to 1 indicating the higher topic loading of a tweet.</p>
        </sec>
        <sec>
          <title>Content Valence</title>
          <p>We used TextBlob [<xref ref-type="bibr" rid="ref49">49</xref>], an open-source Python library, to generate the valence score of each tweet. The range of the valence score is from –1 to 1, with the value of –1 indicating the most negative and the value of 1 indicating the most positive valence.</p>
        </sec>
        <sec>
          <title>Media Presence</title>
          <p>For each tweet, data on whether it had a photo, a gif, or a video were extracted as three separate variables.</p>
        </sec>
        <sec>
          <title>Linguistic Features</title>
          <p>For each tweet, the numbers of hashtags, mentions, and hyperlinks were extracted as three separate variables.</p>
        </sec>
        <sec>
          <title>Account Verification</title>
          <p>For each tweet, whether the account that posted it was verified or not was extracted.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>We performed linear regression analyses to examine the predictors of likes and retweets. Since the purpose of the study was to investigate the factors that affected the popularity and virality of tweets as indexed by like counts and retweet counts, we only considered the tweets that were liked (for the model of like counts) or retweeted (for the model of retweet counts), as in past research [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. In the models, the log-transformed like counts and retweet counts were respectively regressed on 12 topic loadings extracted from topic modeling, the valence score generated from sentiment analysis, three variables of media presence, three variables of linguistic features, and account verification.</p>
      </sec>
      <sec>
        <title>Network Analysis and Visualization</title>
        <p>We used two-mode visualization to present the relationship between topics and the 2500 most liked tweets and the 2500 most retweeted tweets, respectively. To prepare data for rendering each relationship network, we created a node list consisting of topic and tweet nodes, and an edge list consisting of tweet IDs, the topics each tweet was connected to, and an edge weight representing the topic loading of each tweet. Each topic node with its name was sized in proportion to the sum of topic loadings of all tweets. To assist the viewer in discerning topics, we used a community detection algorithm built in Gephi [<xref ref-type="bibr" rid="ref50">50</xref>], which is based on the Louvain modularity method that has been used in prior research [<xref ref-type="bibr" rid="ref12">12</xref>]. Community detection algorithms [<xref ref-type="bibr" rid="ref51">51</xref>] identify cohesive groups in the network [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]. In the network visualization, node color reflected topic community membership.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Content Topics</title>
        <p>We trained a topic model using LDA, with a search space on topic numbers from 3 to 21. Using a uniform search grid on Dirichlet concentration parameters, the model parameters were trained to optimize the coherence score <italic>C<sub>v</sub></italic> [<xref ref-type="bibr" rid="ref54">54</xref>], which is a likelihood measure of word cooccurrence in the same topics. The best model was achieved at 12 topics with <italic>C<sub>v</sub></italic>=0.42. <xref ref-type="table" rid="table1">Table 1</xref> summarizes the 12 topics. Interpretation of each topic was based on the top 10 probable words ranked solely by frequency and jointly by frequency and relevance, as well as review of sample tweets with high topic-specific loadings.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of topics and valence.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="170"/>
            <col width="320"/>
            <col width="330"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td>Topic<break/>number</td>
                <td>Topic label</td>
                <td>Top 10 words by frequency (λ=1)</td>
                <td>Top 10 words by frequency and relevance (λ=0.6)</td>
                <td>Valence</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Vaccine access</td>
                <td>vaccine, community, health, help, access, need, work, pandemic, country, support</td>
                <td>vaccine, community, health, access, help, support, effort, global, distribution, ensure</td>
                <td>0.137</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Vaccine efficacy and rollout</td>
                <td>vaccine, case, new, variant, show, death, test, risk, virus, report</td>
                <td>case, vaccine, variant, show, new, test, death, study, pause, report</td>
                <td>0.147</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Vaccine development and people’s views</td>
                <td>vaccine, people, take, say, would, do, want, think, give, woman</td>
                <td>vaccine, would, take, woman, people, think, enough, do, say, try</td>
                <td>0.158</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Vaccination status</td>
                <td>get, vaccine, vaccinate, shot, people, shoot, vaccinated, first, fully, wait</td>
                <td>get, vaccinate, shot, shoot, people, vaccinated, fully, family, wait, die</td>
                <td>0.143</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Feeling and side effect</td>
                <td>get, vaccine, feel, go, good, day, side effect, make, work, arm</td>
                <td>feel, get, side effect, good, go, arm, day, fact, science, normal</td>
                <td>0.117</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Vaccine appointment</td>
                <td>vaccine, appointment, today, site, schedule, open, visit, call, clinic, vaccination</td>
                <td>appointment, site, vaccine, open, schedule, visit, clinic, join, register, call</td>
                <td>0.133</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Vaccine availability</td>
                <td>vaccine, available, week, say, year, question, old, last, next, come</td>
                <td>available, question, old, year, week, say, last, next, answer, month</td>
                <td>0.149</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Vaccination eligibility and administration</td>
                <td>dose, vaccine, receive, today, first, second, eligible, administer, day, start</td>
                <td>dose, receive, second, eligible, today, first, administer, vaccine, day, begin</td>
                <td>0.354</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Age and issues</td>
                <td>age, vaccine, offer, people, group, encourage, read, rollout, issue, concern</td>
                <td>age, offer, group, encourage, rollout, reason, article, issue, explain, doctor</td>
                <td>0.107</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Preventive measures</td>
                <td>safe, mask, keep, spread, stop, stay, wear, still, continue, passport</td>
                <td>safe, mask, keep, spread, stop, stay, wear, passport, place, home</td>
                <td>0.089</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Student and county</td>
                <td>retweet, check, student, event, walk, turn, county, staff, please, team</td>
                <td>retweet, check, student, event, walk, turn, county, staff, please, team</td>
                <td>0.093</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>Trust and communication</td>
                <td>share, trust, watch, video, speak, play, minute, fall, head, availability</td>
                <td>share, trust, video, speak, play, minute, watch, fall, head, availability</td>
                <td>0.089</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Content Valence</title>
        <p>The overall valence was positive, with a score of 0.145. The range of the valence score is from –1 to 1, with –1 indicating the most negative and 1 indicating the most positive valence. As shown in <xref ref-type="table" rid="table1">Table 1</xref>, all 12 topics were associated with positive valence.</p>
      </sec>
      <sec>
        <title>Determinants of Like Counts</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> reveals the effects of the four categories of independent variables on the log-transformed like counts. The regression model was significant at <italic>P</italic>&#60;.001 (adjusted <italic>R<sup>2</sup></italic>=0.151). RQ1 was related to the determinants of likes. Out of the 12 latent topics identified by topic modeling, Topics 1 to 8 had weak but significant effects on likes. The valence also had a weak but significant effect on likes. Positive tweets increased likes. Media (photo, gif, or video) presence increased likes. Among linguistic features, the number of hashtags and that of external links decreased likes, whereas the number of mentions increased likes. Account verification increased likes.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Linear regression models on predictors of popularity and virality of tweets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="480"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Variables</td>
                <td colspan="4">Ln (like count)<sup>a</sup> (n=286,657)</td>
                <td colspan="3">Ln (retweet count)<sup>a</sup> (n=168,961)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <italic>β</italic>
                </td>
                <td colspan="2"><italic>P</italic> value</td>
                <td colspan="2">
                  <italic>β</italic>
                </td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="10">
                  <bold>Topics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T1: Vaccine access</td>
                <td colspan="2">.029</td>
                <td colspan="2">.048</td>
                <td colspan="2">.062</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T2: Vaccine efficacy and rollout</td>
                <td colspan="2">.049</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.077</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T3: Vaccine development and people’s views</td>
                <td colspan="2">.055</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.078</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T4: Vaccination status</td>
                <td colspan="2">.048</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.068</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T5: Feeling and side effect</td>
                <td colspan="2">.040</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.052</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T6: Vaccine appointment</td>
                <td colspan="2">.027</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.033</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T7: Vaccine availability</td>
                <td colspan="2">.018</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.019</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T8: Vaccination eligibility and administration</td>
                <td colspan="2">.011</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.006</td>
                <td colspan="2">.08</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T9: Age and issues</td>
                <td colspan="2">.009</td>
                <td colspan="2">.13</td>
                <td colspan="2">.009</td>
                <td colspan="2">.10</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T10: Preventive measures</td>
                <td colspan="2">–.030</td>
                <td colspan="2">.26</td>
                <td colspan="2">–.037</td>
                <td colspan="2">.25</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T11: Student and county</td>
                <td colspan="2">.076</td>
                <td colspan="2">.14</td>
                <td colspan="2">–.080</td>
                <td colspan="2">.14</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>T12: Trust and communication</td>
                <td colspan="2">–.079</td>
                <td colspan="2">.11</td>
                <td colspan="2">–.072</td>
                <td colspan="2">.21</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Emotion (valence)</td>
                <td colspan="2">.059</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.0003</td>
                <td>.93</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Media presence</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Has photo</td>
                <td colspan="2">.188</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.088</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Has gif</td>
                <td colspan="2">.019</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.001</td>
                <td colspan="2">.64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Has video</td>
                <td colspan="2">.100</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.084</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Linguistic features</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of hashtags</td>
                <td colspan="2">–.072</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">–.059</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of mentions</td>
                <td colspan="2">.007</td>
                <td colspan="2">.005</td>
                <td colspan="2">–.002</td>
                <td colspan="2">.45</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of external links</td>
                <td colspan="2">–.126</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.003</td>
                <td colspan="2">.18</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Verified account</td>
                <td colspan="2">.452</td>
                <td colspan="2">&#60;.001</td>
                <td colspan="2">.378</td>
                <td>&#60;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>To account for the right skewness of the data distribution, the natural log–transformed like counts and retweet counts were used in the analyses.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Determinants of Retweet Counts</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> also reveals the effects of the four categories of independent variables on the log-transformed retweet counts. The regression model was significant at <italic>P</italic>&#60;.001 (adjusted <italic>R<sup>2</sup></italic>=0.130). RQ2 focused on the determinants of retweets. Out of the 12 latent topics identified by topic modeling, Topics 1 to 7 had weak but significant effects on retweets. The valence had no effect on retweets. Media presence of a photo or video increased retweets. Among linguistic features, the number of hashtags decreased retweets. Account verification increased retweets.</p>
      </sec>
      <sec>
        <title>Topic and Tweet Relationship Networks</title>
        <p>RQ3 focused on salient topics among the most liked tweets. As shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>, among the 2500 most liked tweets, Louvain clustering identified 4 out of the 12 topics. The tweets were clustered around vaccine access (Topic 1), followed closely by vaccine efficacy and rollout (Topic 2) and then vaccine development and people’s views (Topic 3). The other topics were not salient and presented as one remaining cluster. Each topic community was represented by one color.</p>
        <p><xref ref-type="table" rid="table3">Table 3</xref> summarizes the top 10 liked paraphrased tweets, like counts, dominant topics, and topic loadings. The first most liked tweet, which was posted in July 2020 and had 91,163 likes as of April 30, 2021, was clustered around vaccine access (Topic 1). It called for Medicare for All along with free COVID testing, treatment, and vaccines.</p>
        <p>RQ4 focused on salient topics of the most retweeted tweets. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>, among the top 2500 most retweeted tweets, Louvain clustering identified 5 out of the 12 topics the LDA identified in the total tweets. The top retweeted tweets mostly clustered around vaccine efficacy and rollout (Topic 2), closely followed by access to vaccine (Topic 1), and then vaccine development and people’s views (Topic 3) and vaccination status (Topic 4). The other topics were not salient and presented as one remaining cluster. Each topic community was represented by one color.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Topic communities of the 2500 most liked tweets. Two-mode visualization was used to present the relationship between topics and the 2500 most liked tweets. The topics and the tweets are connected by edges weighted by topic loadings of each tweet. Each topic node with its name is sized in proportion to the sum of topic loadings of all tweets. Colors indicate topic communities as partitioned by the Louvain algorithm.</p>
          </caption>
          <graphic xlink:href="publichealth_v7i12e32814_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Top 10 liked paraphrased tweets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="60"/>
            <col width="90"/>
            <col width="490"/>
            <col width="230"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Like rank</td>
                <td>Like count</td>
                <td>Tweet</td>
                <td>Dominant topic number and label</td>
                <td>Dominant topic loading</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>91,163</td>
                <td>Medicare for All along with free COVID testing, treatment, and vaccines are necessities of a decent society (July 2020)<sup>a</sup></td>
                <td>Topic 1: Vaccine access</td>
                <td>0.518</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>90,177</td>
                <td>Trump’s attempt to deny vaccines to New York is playing politics with people’s lives (November 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.578</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>63,681</td>
                <td>I participated in Moderna experiments to see if its vaccine and booster were safe and effective (April 2021)</td>
                <td>Topic 3: Vaccine development and people’s views</td>
                <td>0.373</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>55,223</td>
                <td>President Biden took credit for the vaccine from President Trump (March 2021)<sup>a</sup></td>
                <td>Topic 1: Vaccine access</td>
                <td>0.964</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>48,631</td>
                <td>The number of vaccine doses administered outnumbered that of new cases at a 10-to-1 ratio (February 2021)</td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.514</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>46,997</td>
                <td>I had ended my support for Trump and started taking COVID seriously. I got vaccinated, thanks to Biden and health workers (March 2021)</td>
                <td>Topic 4: Vaccination status</td>
                <td>0.578</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>36,753</td>
                <td>Like with smallpox, vaccinations along with surveillance and contact tracing are essential to COVID’s elimination (April 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.547</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>36,250</td>
                <td>Pfizer’s mRNA vaccine candidate showed initial evidence of efficacy (November 2020)<sup>a</sup></td>
                <td>Topic 3: Vaccine development and people’s views</td>
                <td>0.844</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>35,604</td>
                <td>President Trump delivered on his goal of having a safe and effective COVID vaccine by the end of the year (May 2020)</td>
                <td>Topic 3: Vaccine development and people’s views</td>
                <td>0.533</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>35,514</td>
                <td>The current vaccination pace will take 10 years to reach herd immunity. We need to speed this up (December 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.385</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Tweet was among the top 10 liked and concurrently one of the top 10 retweeted tweets.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Topic communities of the 2500 most retweeted tweets. Two-mode visualization was used to present the relationship between topics and the 2500 most retweeted tweets. The topics and the tweets are connected by edges weighted by topic loadings of each tweet. Each topic node with its name is sized in proportion to the sum of topic loadings of all tweets. Colors indicate topic communities as partitioned by the Louvain algorithm.</p>
          </caption>
          <graphic xlink:href="publichealth_v7i12e32814_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table4">Table 4</xref> summarizes the top 10 retweeted paraphrased tweets, their retweet counts, and dominant topics. The first most retweeted tweet, which was posted in December 2020 and garnered 17,427 retweets through April 2021, clustered around vaccine efficacy and rollout (Topic 2). This tweet emphasized the long time needed to reach herd immunity based on the vaccination pace at that time.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Top 10 retweeted paraphrased tweets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="70"/>
            <col width="90"/>
            <col width="480"/>
            <col width="230"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Retweet rank</td>
                <td>Retweet count</td>
                <td>Tweet</td>
                <td>Dominant topic number and label</td>
                <td>Dominant topic loading</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>17,427</td>
                <td>The current vaccination pace will take 10 years to reach herd immunity. We need to speed this up (December 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.385</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>16,288</td>
                <td>Medicare for All along with free COVID testing, treatment, and vaccines are necessities of a decent society (July 2020)<sup>a</sup></td>
                <td>Topic 1: Vaccine access</td>
                <td>0.518</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>15,575</td>
                <td>Trump’s attempt to deny vaccines to New York is playing politics with people’s lives (November 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.578</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>14,536</td>
                <td>The FDA<sup>b</sup> and CDC<sup>c</sup> recommend a pause in the use of the Johnson &#38; Johnson COVID19 vaccine (April 2021)</td>
                <td>Topic 1: Vaccine access</td>
                <td>0.417</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>12,473</td>
                <td>Pfizer’s mRNA vaccine candidate showed initial evidence of efficacy (November 2020)<sup>a</sup></td>
                <td>Topic 3: Vaccine development and people’s views</td>
                <td>0.844</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>11,684</td>
                <td>President Biden took credit for the vaccine from President Trump (March 2021)<sup>a</sup></td>
                <td>Topic 1: Vaccine access</td>
                <td>0.964</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>11,046</td>
                <td>Russian vaccine trial shows high efficacy (February 2021)</td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.618</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>10,151</td>
                <td>UK’s vaccine is safe and induces an immune reaction (July 2020)</td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.844</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>8586</td>
                <td>Like with smallpox, vaccinations along with surveillance and contact tracing are essential to COVID’s elimination (April 2020)<sup>a</sup></td>
                <td>Topic 2: Vaccine efficacy and rollout</td>
                <td>0.547</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>8282</td>
                <td>Why we need two doses of mRNA vaccines (April 2021)</td>
                <td>Topic 1: Vaccine access</td>
                <td>0.488</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Tweet was among the top 10 retweeted and concurrently one of the top 10 liked tweets.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>FDA: Food and Drug Administration.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>CDC: Centers for Disease Control and Prevention.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>This study investigated the combined effects of the three categories of message-level factors on the popularity and virality of tweets about COVID-19 vaccines using text-mining techniques. We also examined the topic communities of the most liked and most retweeted tweets using network analysis and visualization. In this section, we first discuss how text-mined topics and valence, together with autoextracted information about social media message features, affected likes and retweets. We further discuss limitations and implications for the directions of vaccine campaigns.</p>
        <p>Out of the 12 latent topics identified by topic modeling, Topics 1-8 increased likes and Topics 1-7 increased retweets. Vaccine development and people’s views (Topic 3) had the largest positive impact on likes and retweets, as reflected by <italic>β</italic> coefficients. The intrinsic novelty feature of COVID-19 vaccines could provide plausible explanations. The vaccines were newly developed to help fight off the new coronavirus, and two out of the four brands examined in the study used mRNA, a technology that had not been approved previously for general use in humans [<xref ref-type="bibr" rid="ref5">5</xref>]. Therefore, information about vaccine development and technology was more popular and viral. Relatedly, 3 out of the top 10 liked tweets reflected Topic 3, two of which were about mRNA vaccines. One out of the top 10 retweeted tweets reflected Topic 3, which was about mRNA vaccines. The findings were consistent with those in past research that suggested the impact of novel content in the social transmission of health news [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>Vaccine efficacy and rollout (Topic 2) had the second largest positive impact on likes and retweets, as indicated by <italic>β</italic> coefficients. Prior research revealed the impact of efficacy information on the virality of online health news [<xref ref-type="bibr" rid="ref26">26</xref>] and in tweets about the COVID-19 pandemic [<xref ref-type="bibr" rid="ref25">25</xref>]. This study also underscores the importance of efficacy information on the virality of tweets about COVID-19 vaccines.</p>
        <p>The findings suggest that tweets focusing on the topic of vaccine development and people’s views, and the topic of vaccine efficacy and rollout highly meet the public’s needs for information during the COVID-19 pandemic, and therefore tend to become popular and viral on Twitter. It is plausible that these tweets provide useful and novel information that helps to reduce uncertainty in a health crisis. Vaccine campaigns could provide more information about these topics to help the diffusion of information on social media.</p>
        <p>It is notable that polarized political information such as that supporting a political party could be intertwined with different topics. Polarized political information was contained in 5 out of the top 10 liked tweets and in 3 out of the top 10 retweeted tweets. As political stance may play a role in the vaccine debate in the United States [<xref ref-type="bibr" rid="ref9">9</xref>], it would be interesting for future studies to investigate its impact in addition to other factors.</p>
        <p>This study showed that the overall valence of the tweets was positive. This was consistent with findings in prior research on tweets about vaccines in general [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>] and about COVID-19 vaccines in particular, regardless of country [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. The results showed that positive valence increased likes. This is in alignment with findings in prior research [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. In comparison, the results showed no impact of valence on retweets. Past research revealed mixed findings regarding the effects of valence on retweets [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. The explanation may rest in the complex cognitive sources underlying retweeting behavior. Compared with liking, retweeting is a more social behavior that may involve expected reactions from recipients about the content and/or the sender [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>Regarding social media message features, account verification had the largest positive impact on likes and retweets among all factors, as reflected by <italic>β</italic> coefficients. This finding underscores the importance of account authentication in the popularity and virality of tweets in the face of massive amounts of information. Credible information is vital to reduce uncertainty in a crisis according to the uncertainty reduction theory [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. However, it is notable that account authentication does not always mean content authentication. Accordingly, misinformation spread by verified accounts could pose greater challenges to vaccine campaigns. Vaccine campaigns could try to use and motivate different verified accounts, including institutional and individual accounts, to share credible information for wider reach and to prevent the spread of misinformation.</p>
        <p>Furthermore, in alignment with the literature [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], the presence of a photo or video enhanced likes and retweets. The presence of a gif increased likes but did not affect retweets. In addition, consistent with the literature [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], the number of hashtags decreased likes and retweets. The number of external links decreased likes, but did not affect retweets. Inconsistent with the literature [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>], the number of mentions facilitated likes, but did not affect retweets.</p>
        <p>The results revealed that among the examined factors, more could impact likes than retweets. Eight topics predicted likes, whereas seven predicted retweets. Valence predicted likes but did not predict retweets. The presence of a gif, the number of mentions, and the number of external links predicted likes but not retweets. A comparison between like counts of the top 10 liked tweets and retweet counts of the top 10 retweeted tweets also suggested that a tweet was much more likely to be liked than to be retweeted. The number of likes for the highest liked tweet was more than five times the number of retweets for the highest retweeted tweet. These findings indicate that it is more challenging to make a tweet viral than to make it popular.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several limitations. We used machine-based text mining to identify the underlying topics and valence in the vast amounts of tweets about COVID-19 vaccines. We then included the text-mined topics and valence, together with autoextracted information of social media message features in the regression models for prediction of the popularity and virality of tweets. Although this approach reduced manual coding, the results were mostly limited to autoidentified and autoextracted factors. Our manual reviews of sample tweets in each topic as well as the top 10 liked and retweeted tweets provided clues that politically polarized information could be intertwined with different topics. It would be interesting for future research to investigate how this may affect the popularity and virality of tweets. For instance, retweeting could derive from complex cognitive sources such as self-presentation [<xref ref-type="bibr" rid="ref31">31</xref>] and identity communication [<xref ref-type="bibr" rid="ref27">27</xref>]. A question arises as to whether consistency in the political stance between the sender and the recipients impacts retweets.</p>
        <p>Furthermore, the findings were limited to US-based public discourse about COVID-19 vaccines on Twitter. Social media platforms have played an important role in disseminating information and opinions during the COVID-19 pandemic [<xref ref-type="bibr" rid="ref56">56</xref>]. It would be interesting for future research to compare Twitter with other social media platforms. For instance, the relative significance of examined factors in predicting popularity and virality may vary depending on the social media platform analyzed, as each has its own features.</p>
        <p>Finally, the results revealed message-level drivers of the popularity and virality of tweets about COVID-19 vaccines. We included account verification as an independent variable in the regression models and the results showed that it had a positive impact on likes and retweets. However, we did not identify social bots in the massive amounts of tweets. It would be interesting for future studies to investigate the impact of social bots.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study suggests the public interest in and demand for information about vaccine development and people’s views, as well as vaccine efficacy and rollout during the COVID-19 pandemic. These topics, along with the use of media and verified accounts, enhance the popularity and virality of tweets. These issues could be addressed in vaccine campaigns to help the diffusion of content on Twitter.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BOW</term>
          <def>
            <p>bag of words</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CDC</term>
          <def>
            <p>Centers for Disease Control and Prevention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">mRNA</term>
          <def>
            <p>messenger RNA</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>WHO Director-General's opening remarks at the media briefing on COVID-19 - 11 March</article-title>
          <source>World Health Organization</source>
          <year>2020</year>
          <month>03</month>
          <day>11</day>
          <access-date>2020-03-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/director-general/speeches/detail/who-director-general-s-opening-remarks-at-the-media-briefing-on-covid-19---11-march-2020">https://www.who.int/director-general/speeches/detail/who-director-general-s-opening-remarks-at-the-media-briefing-on-covid-19---11-march-2020</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 Dashboard</article-title>
          <source>Johns Hopkins University</source>
          <access-date>2021-04-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://coronavirus.jhu.edu/map.html">https://coronavirus.jhu.edu/map.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 vaccines</article-title>
          <source>World Health Organization</source>
          <year>2021</year>
          <access-date>2021-07-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/emergencies/diseases/novel-coronavirus-2019/covid-19-vaccines">https://www.who.int/emergencies/diseases/novel-coronavirus-2019/covid-19-vaccines</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>Science brief: COVID-19 vaccines and vaccination</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2021</year>
          <month>07</month>
          <day>27</day>
          <access-date>2021-07-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/science/science-briefs/fully-vaccinated-people.html">https://www.cdc.gov/coronavirus/2019-ncov/science/science-briefs/fully-vaccinated-people.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <source>The lightning-fast quest for COVID vaccines—and what it means for other diseases</source>
          <year>2020</year>
          <month>12</month>
          <day>18</day>
          <access-date>2020-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/d41586-020-03626-1">https://www.nature.com/articles/d41586-020-03626-1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zipkin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>New vaccine approaches present new possibilities, but new challenges</source>
          <year>2021</year>
          <month>06</month>
          <day>01</day>
          <access-date>2021-06-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/d43747-021-00079-x">https://www.nature.com/articles/d43747-021-00079-x</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iannelli</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <source>An overview of the vaccine debate: looking at both sides of the argument</source>
          <year>2021</year>
          <month>06</month>
          <day>04</day>
          <access-date>2021-06-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.verywellhealth.com/the-vaccine-debate-2633685">https://www.verywellhealth.com/the-vaccine-debate-2633685</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kerr</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Panagopoulos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>van der Linden</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Political polarization on COVID-19 pandemic response in the United States</article-title>
          <source>Person Ind Diff</source>
          <year>2021</year>
          <month>09</month>
          <volume>179</volume>
          <fpage>110892</fpage>
          <pub-id pub-id-type="doi">10.1016/j.paid.2021.110892</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fridman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gershon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gneezy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 and vaccine hesitancy: A longitudinal study</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <month>04</month>
          <day>16</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>e0250123</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0250123"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0250123</pub-id>
          <pub-id pub-id-type="medline">33861765</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-35660</pub-id>
          <pub-id pub-id-type="pmcid">PMC8051771</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Why the COVID-19 vaccine distribution has gotten off to a slow start</source>
          <year>2021</year>
          <month>01</month>
          <day>01</day>
          <access-date>2021-01-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.npr.org/2021/01/01/952652202/why-the-covid-19-vaccine-distribution-has-gotten-off-to-a-slow-start">https://www.npr.org/2021/01/01/952652202/why-the-covid-19-vaccine-distribution-has-gotten-off-to-a-slow-start</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blankenship</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Goff</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tse</surname>
              <given-names>ZTH</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Saroha</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fung</surname>
              <given-names>ICH</given-names>
            </name>
          </person-group>
          <article-title>Sentiment, contents, and retweets: a study of two vaccine-related Twitter datasets</article-title>
          <source>Perm J</source>
          <year>2018</year>
          <volume>22</volume>
          <fpage>17</fpage>
          <lpage>138</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29911966"/>
          </comment>
          <pub-id pub-id-type="doi">10.7812/TPP/17-138</pub-id>
          <pub-id pub-id-type="medline">29911966</pub-id>
          <pub-id pub-id-type="pii">17-138</pub-id>
          <pub-id pub-id-type="pmcid">PMC6004971</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gunaratne</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Coomes</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Haghbayan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Temporal trends in anti-vaccine discourse on Twitter</article-title>
          <source>Vaccine</source>
          <year>2019</year>
          <month>08</month>
          <day>14</day>
          <volume>37</volume>
          <issue>35</issue>
          <fpage>4867</fpage>
          <lpage>4871</lpage>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2019.06.086</pub-id>
          <pub-id pub-id-type="medline">31300292</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(19)30876-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Love</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Himelboim</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Holton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Twitter as a source of vaccination information: content drivers and what they are saying</article-title>
          <source>Am J Infect Control</source>
          <year>2013</year>
          <month>06</month>
          <volume>41</volume>
          <issue>6</issue>
          <fpage>568</fpage>
          <lpage>570</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ajic.2012.10.016</pub-id>
          <pub-id pub-id-type="medline">23726548</pub-id>
          <pub-id pub-id-type="pii">S0196-6553(12)01371-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ortiz-Sánchez</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Velando-Soriano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pradas-Hernández</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vargas-Román</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gómez-Urquiza</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Cañadas-De la Fuente</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Albendín-García</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Analysis of the anti-vaccine movement in social networks: a systematic review</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>07</month>
          <day>27</day>
          <volume>17</volume>
          <issue>15</issue>
          <fpage>5394</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17155394"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17155394</pub-id>
          <pub-id pub-id-type="medline">32727024</pub-id>
          <pub-id pub-id-type="pii">ijerph17155394</pub-id>
          <pub-id pub-id-type="pmcid">PMC7432886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tahir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gogate</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dashtipour</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-enabled analysis of public attitudes on Facebook and Twitter toward COVID-19 vaccines in the United Kingdom and the United States: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>05</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e26627</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e26627/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26627</pub-id>
          <pub-id pub-id-type="medline">33724919</pub-id>
          <pub-id pub-id-type="pii">v23i4e26627</pub-id>
          <pub-id pub-id-type="pmcid">PMC8023383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Luli</surname>
              <given-names>GK</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine-related discussion on Twitter: topic modeling and sentiment analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>06</month>
          <day>29</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e24435</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e24435/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24435</pub-id>
          <pub-id pub-id-type="medline">34115608</pub-id>
          <pub-id pub-id-type="pii">v23i6e24435</pub-id>
          <pub-id pub-id-type="pmcid">PMC8244724</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-Alrazaq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alhuwail</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Househ</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hamdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Top concerns of Tweeters during the COVID-19 pandemic: infoveillance study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>21</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e19016</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e19016/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19016</pub-id>
          <pub-id pub-id-type="medline">32287039</pub-id>
          <pub-id pub-id-type="pii">v22i4e19016</pub-id>
          <pub-id pub-id-type="pmcid">PMC7175788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Valkunde</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Moustakas</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Topics, trends, and sentiments of tweets about the COVID-19 pandemic: temporal infoveillance study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>10</month>
          <day>23</day>
          <volume>22</volume>
          <issue>10</issue>
          <fpage>e22624</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/10/e22624/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22624</pub-id>
          <pub-id pub-id-type="medline">33006937</pub-id>
          <pub-id pub-id-type="pii">v22i10e22624</pub-id>
          <pub-id pub-id-type="pmcid">PMC7588259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doogan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Buntine</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Linger</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brunt</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Public perceptions and attitudes toward COVID-19 nonpharmaceutical interventions across six countries: a topic modeling analysis of Twitter data</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>09</month>
          <day>03</day>
          <volume>22</volume>
          <issue>9</issue>
          <fpage>e21419</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/9/e21419/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21419</pub-id>
          <pub-id pub-id-type="medline">32784190</pub-id>
          <pub-id pub-id-type="pii">v22i9e21419</pub-id>
          <pub-id pub-id-type="pmcid">PMC7505256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwok</surname>
              <given-names>SWH</given-names>
            </name>
            <name name-style="western">
              <surname>Vadde</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Tweet topics and sentiments relating to COVID-19 vaccination among Australian Twitter users: machine learning analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>05</month>
          <day>19</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>e26953</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/5/e26953/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26953</pub-id>
          <pub-id pub-id-type="medline">33886492</pub-id>
          <pub-id pub-id-type="pii">v23i5e26953</pub-id>
          <pub-id pub-id-type="pmcid">PMC8136408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Akinwunmi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>CJP</given-names>
            </name>
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Health communication through news media during the early stage of the COVID-19 outbreak in China: digital topic modeling approach</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>28</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e19118</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e19118/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19118</pub-id>
          <pub-id pub-id-type="medline">32302966</pub-id>
          <pub-id pub-id-type="pii">v22i4e19118</pub-id>
          <pub-id pub-id-type="pmcid">PMC7189789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>IB</given-names>
            </name>
          </person-group>
          <article-title>Predicting positive user responses to social media advertising: the roles of emotional appeal, informativeness, and creativity</article-title>
          <source>Int J Inf Manag</source>
          <year>2016</year>
          <month>06</month>
          <volume>36</volume>
          <issue>3</issue>
          <fpage>360</fpage>
          <lpage>373</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijinfomgt.2016.01.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pancer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Poole</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The popularity and virality of political social media: hashtags, mentions, and links predict likes and retweets of 2016 U.S. presidential nominees’ tweets</article-title>
          <source>Soc Influ</source>
          <year>2016</year>
          <month>12</month>
          <day>12</day>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>259</fpage>
          <lpage>270</lpage>
          <pub-id pub-id-type="doi">10.1080/15534510.2016.1265582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <article-title>Using Twitter</article-title>
          <source>Twitter</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://help.twitter.com/en/using-twitter/">https://help.twitter.com/en/using-twitter/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nanath</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Joy</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Leveraging Twitter data to analyze the virality of Covid-19 tweets: a text mining approach</article-title>
          <source>Behav Inf Technol</source>
          <year>2021</year>
          <month>06</month>
          <day>17</day>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1080/0144929x.2021.1941259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HS</given-names>
            </name>
          </person-group>
          <article-title>Attracting views and going viral: how message features and news-sharing channels affect health news diffusion</article-title>
          <source>J Commun</source>
          <year>2015</year>
          <month>06</month>
          <day>01</day>
          <volume>65</volume>
          <issue>3</issue>
          <fpage>512</fpage>
          <lpage>534</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26441472"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jcom.12160</pub-id>
          <pub-id pub-id-type="medline">26441472</pub-id>
          <pub-id pub-id-type="pmcid">PMC4591750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Milkman</surname>
              <given-names>KL</given-names>
            </name>
          </person-group>
          <article-title>What makes online content viral?</article-title>
          <source>J Market Res</source>
          <year>2012</year>
          <month>04</month>
          <day>01</day>
          <volume>49</volume>
          <issue>2</issue>
          <fpage>192</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.1509/jmr.10.0353</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moriarty</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Stryker</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Prevention and screening efficacy messages in newspaper accounts of cancer</article-title>
          <source>Health Educ Res</source>
          <year>2008</year>
          <month>06</month>
          <day>01</day>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>487</fpage>
          <lpage>498</lpage>
          <pub-id pub-id-type="doi">10.1093/her/cyl163</pub-id>
          <pub-id pub-id-type="medline">17289658</pub-id>
          <pub-id pub-id-type="pii">cyl163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCormack</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Squiers</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Frasier</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bann</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>MacDonald</surname>
              <given-names>PDM</given-names>
            </name>
          </person-group>
          <article-title>Gaps in knowledge about COVID-19 among US residents early in the outbreak</article-title>
          <source>Public Health Rep</source>
          <year>2021</year>
          <month>11</month>
          <day>11</day>
          <volume>136</volume>
          <issue>1</issue>
          <fpage>107</fpage>
          <lpage>116</lpage>
          <pub-id pub-id-type="doi">10.1177/0033354920970182</pub-id>
          <pub-id pub-id-type="medline">33176108</pub-id>
          <pub-id pub-id-type="pmcid">PMC7856374</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The impact of language on retweeting during acute natural disasters: uncertainty reduction and language expectancy perspectives</article-title>
          <source>Ind Manag Data Syst</source>
          <year>2020</year>
          <month>06</month>
          <day>29</day>
          <volume>120</volume>
          <issue>8</issue>
          <fpage>1501</fpage>
          <lpage>1519</lpage>
          <pub-id pub-id-type="doi">10.1108/imds-12-2019-0711</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wojnicki</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Godes</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Word-of-mouth as self-enhancement</article-title>
          <source>SSRN J</source>
          <year>2008</year>
          <month>04</month>
          <day>28</day>
          <fpage>06-01</fpage>
          <pub-id pub-id-type="doi">10.2139/ssrn.908999</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arieh</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Algom</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Processing picture-word stimuli: the contingent nature of picture and of word superiority</article-title>
          <source>J Exp Psychol Learn Mem Cogn</source>
          <year>2002</year>
          <month>01</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>221</fpage>
          <lpage>232</lpage>
          <pub-id pub-id-type="doi">10.1037/0278-7393.28.1.221</pub-id>
          <pub-id pub-id-type="medline">11827082</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shaki</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Algom</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The locus and nature of semantic congruity in symbolic comparison: evidence from the Stroop effect</article-title>
          <source>Mem Cognit</source>
          <year>2002</year>
          <month>01</month>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.3758/bf03195260</pub-id>
          <pub-id pub-id-type="medline">11958352</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reber</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarz</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Winkielman</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Processing fluency and aesthetic pleasure: is beauty in the perceiver's processing experience?</article-title>
          <source>Pers Soc Psychol Rev</source>
          <year>2004</year>
          <month>12</month>
          <day>21</day>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>364</fpage>
          <lpage>382</lpage>
          <pub-id pub-id-type="doi">10.1207/s15327957pspr0804_3</pub-id>
          <pub-id pub-id-type="medline">15582859</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alter</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Oppenheimer</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Uniting the tribes of fluency to form a metacognitive nation</article-title>
          <source>Pers Soc Psychol Rev</source>
          <year>2009</year>
          <month>08</month>
          <day>28</day>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>219</fpage>
          <lpage>235</lpage>
          <pub-id pub-id-type="doi">10.1177/1088868309341564</pub-id>
          <pub-id pub-id-type="medline">19638628</pub-id>
          <pub-id pub-id-type="pii">1088868309341564</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>Relaunching verification and what's next</article-title>
          <source>Twitter</source>
          <year>2021</year>
          <month>05</month>
          <day>20</day>
          <access-date>2021-05-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://blog.twitter.com/en_us/topics/company/2021/relaunching-verification-and-whats-next">https://blog.twitter.com/en_us/topics/company/2021/relaunching-verification-and-whats-next</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <article-title>snscrape</article-title>
          <source>GitHub</source>
          <access-date>2021-04-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/JustAnotherArchivist/snscrape">https://github.com/JustAnotherArchivist/snscrape</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Leader</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yom-Tov</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Budenz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Klassen</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Applying multiple data collection tools to quantify human papillomavirus vaccine communication on Twitter</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>12</month>
          <day>05</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e318</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e318/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6670</pub-id>
          <pub-id pub-id-type="medline">27919863</pub-id>
          <pub-id pub-id-type="pii">v18i12e318</pub-id>
          <pub-id pub-id-type="pmcid">PMC5168526</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Kearney</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Hauer</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Selvan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Koku</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Leader</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Dimensions of misinformation about the HPV vaccine on Instagram: content and network analysis of social media characteristics</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>12</month>
          <day>03</day>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>e21451</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/12/e21451/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21451</pub-id>
          <pub-id pub-id-type="medline">33270038</pub-id>
          <pub-id pub-id-type="pii">v22i12e21451</pub-id>
          <pub-id pub-id-type="pmcid">PMC7746500</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <article-title>Different COVID-19 vaccines</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2021</year>
          <month>05</month>
          <day>27</day>
          <access-date>2021-06-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/vaccines/different-vaccines.html">https://www.cdc.gov/coronavirus/2019-ncov/vaccines/different-vaccines.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <article-title>Safe COVID-19 vaccines for Europeans</article-title>
          <source>European Commission</source>
          <year>2021</year>
          <access-date>2021-04-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ec.europa.eu/info/live-work-travel-eu/coronavirus-response/safe-covid-19-vaccines-europeans_en">https://ec.europa.eu/info/live-work-travel-eu/coronavirus-response/safe-covid-19-vaccines-europeans_en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Řehůřek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Gensim—statistical semantics in Python</article-title>
          <year>2011</year>
          <conf-name>European meeting on Python in Science</conf-name>
          <conf-date>August 25-28, 2011</conf-date>
          <conf-loc>Paris, France</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Raghavan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schütze</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>Introduction to Information Retrieval</source>
          <year>2008</year>
          <publisher-loc>Cambridge, UK</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>NLTK: the natural language toolkit</article-title>
          <year>2002</year>
          <conf-name>Association for Computational Linguistics-02 Workshop on Effective tools and methodologies for teaching natural language processing and computational linguistics</conf-name>
          <conf-date>July 2002</conf-date>
          <conf-loc>Morristown, NJ</conf-loc>
          <fpage>63</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.3115/1118108.1118117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <month>03</month>
          <day>01</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <pub-id pub-id-type="doi">10.5555/944919.944937</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allahyari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pouriyeh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Assefi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Safaei</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Trippe</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Kochut</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Text summarization techniques: a brief survey</article-title>
          <source>Int J Adv Comput Sci Appl</source>
          <year>2017</year>
          <volume>8</volume>
          <issue>10</issue>
          <fpage>397</fpage>
          <lpage>405</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://thesai.org/Publications/ViewPaper?Volume=8&amp;Issue=10&amp;Code=IJACSA&amp;SerialNo=52"/>
          </comment>
          <pub-id pub-id-type="doi">10.14569/ijacsa.2017.081052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maier</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Waldherr</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miltner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wiedemann</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Niekler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Keinert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pfetsch</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Heyer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Reber</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Häussler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid-Petri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Applying LDA topic modeling in communication research: toward a valid and reliable methodology</article-title>
          <source>Commun Methods Meas</source>
          <year>2018</year>
          <month>02</month>
          <day>16</day>
          <volume>12</volume>
          <issue>2-3</issue>
          <fpage>93</fpage>
          <lpage>118</lpage>
          <pub-id pub-id-type="doi">10.1080/19312458.2018.1430754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sievert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shirley</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>LDAvis: a method for visualizing and interpreting topics</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the Workshop on Interactive Language Learning, Visualization, Interfaces at the Association for Computational Linguistics</conf-name>
          <conf-date>Jun 2014</conf-date>
          <conf-loc>Baltimore, MD</conf-loc>
          <pub-id pub-id-type="doi">10.13140/2.1.1394.3043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <source>TextBlob: simplified text processing</source>
          <access-date>2021-01-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://textblob.readthedocs.io/">https://textblob.readthedocs.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <source>Gephi. Version 0.9.2</source>
          <access-date>2021-04-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gephi.org/">https://gephi.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>MEJ</given-names>
            </name>
            <name name-style="western">
              <surname>Girvan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Finding and evaluating community structure in networks</article-title>
          <source>Phys Rev E</source>
          <year>2004</year>
          <month>02</month>
          <day>26</day>
          <volume>69</volume>
          <issue>2</issue>
          <fpage>026113</fpage>
          <pub-id pub-id-type="doi">10.1103/physreve.69.026113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fortunato</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Community detection in graphs</article-title>
          <source>Phys Rep</source>
          <year>2010</year>
          <month>02</month>
          <volume>486</volume>
          <issue>3-5</issue>
          <fpage>75</fpage>
          <lpage>174</lpage>
          <pub-id pub-id-type="doi">10.1016/j.physrep.2009.11.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ewing-Nelson</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schlitt</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Marathe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abbas</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Swarup</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Semantic network analysis of vaccine sentiment in online social media</article-title>
          <source>Vaccine</source>
          <year>2017</year>
          <month>06</month>
          <day>22</day>
          <volume>35</volume>
          <issue>29</issue>
          <fpage>3621</fpage>
          <lpage>3638</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28554500"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2017.05.052</pub-id>
          <pub-id pub-id-type="medline">28554500</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(17)30688-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC5548132</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Röder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Both</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hinneburg</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploring the space of topic coherence measures</article-title>
          <year>2015</year>
          <conf-name>Proceedings of the 8th ACM International Conference on Web Search and Data Mining</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <fpage>399</fpage>
          <lpage>408</lpage>
          <pub-id pub-id-type="doi">10.1145/2684822.2685324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Bradac</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <source>Language and social knowledge: uncertainty in interpersonal relations (Vol. 2)</source>
          <year>1982</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Hodder Education</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Lurie</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Social media and emergency preparedness in response to novel coronavirus</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>05</month>
          <day>26</day>
          <volume>323</volume>
          <issue>20</issue>
          <fpage>2011</fpage>
          <lpage>2012</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.4469</pub-id>
          <pub-id pub-id-type="medline">32202611</pub-id>
          <pub-id pub-id-type="pii">2763596</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
