<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v2i2e161</article-id>
    <article-id pub-id-type="pmid">27765731</article-id>
    <article-id pub-id-type="doi">10.2196/publichealth.5901</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Evaluating Google, Twitter, and Wikipedia as Tools for Influenza Surveillance Using Bayesian Change Point Analysis: A Comparative Analysis</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Sullivan</surname>
          <given-names>Patrick</given-names>
        </name>
      </contrib>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Slok</surname>
          <given-names>Edwin</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Su</surname>
          <given-names>Wu-Chen</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Paul</surname>
          <given-names>Michael</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Broniatowski</surname>
          <given-names>David</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes">
      <name name-style="western">
        <surname>Sharpe</surname>
        <given-names>J Danielle</given-names>
      </name>
      <degrees>MS</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>Rollins School of Public Health</institution>
        <institution>Department of Epidemiology</institution>
        <institution>Emory University</institution>
        <addr-line>1518 Clifton Road NE</addr-line>
        <addr-line>Atlanta, GA, 30322</addr-line>
        <country>United States</country>
        <phone>1 912 399 2811</phone>
        <fax>1 404 727 8737</fax>
        <email>danielle.sharpe@emory.edu</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1898-6202</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Hopkins</surname>
          <given-names>Richard S</given-names>
        </name>
        <degrees>MSPH, MD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3765-8810</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Cook</surname>
          <given-names>Robert L</given-names>
        </name>
        <degrees>MPH, MD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7770-3754</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Striley</surname>
          <given-names>Catherine W</given-names>
        </name>
        <degrees>MPE, MSW, PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2973-7842</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>College of Public Health and Health Professions</institution>
    <institution>Department of Epidemiology</institution>  
    <institution>University of Florida</institution>  
    <addr-line>Gainesville, FL</addr-line>
    <country>United States</country></aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>Rollins School of Public Health</institution>
    <institution>Department of Epidemiology</institution>  
    <institution>Emory University</institution>  
    <addr-line>Atlanta, GA</addr-line>
    <country>United States</country></aff>
    <author-notes>
      <corresp>Corresponding Author: J Danielle Sharpe 
      <email>danielle.sharpe@emory.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Jul-Dec</season><year>2016</year></pub-date>
    <pub-date pub-type="epub">
      <day>20</day>
      <month>10</month>
      <year>2016</year>
    </pub-date>
    <volume>2</volume>
    <issue>2</issue>
    <elocation-id>e161</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>23</day>
        <month>4</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>27</day>
        <month>7</month>
        <year>2016</year>
      </date>
      <date date-type="rev-recd">
        <day>31</day>
        <month>8</month>
        <year>2016</year>
      </date>
      <date date-type="accepted">
        <day>21</day>
        <month>9</month>
        <year>2016</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©J Danielle Sharpe, Richard S Hopkins, Robert L Cook, Catherine W Striley. Originally published in JMIR Public Health and Surveillance (http://publichealth.jmir.org), 20.10.2016.</copyright-statement>
    <copyright-year>2016</copyright-year>
    <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on http://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://publichealth.jmir.org/2016/2/e161/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Traditional influenza surveillance relies on influenza-like illness (ILI) syndrome that is reported by health care providers. It primarily captures individuals who seek medical care and misses those who do not. Recently, Web-based data sources have been studied for application to public health surveillance, as there is a growing number of people who search, post, and tweet about their illnesses before seeking medical care. Existing research has shown some promise of using data from Google, Twitter, and Wikipedia to complement traditional surveillance for ILI. However, past studies have evaluated these Web-based sources individually or dually without comparing all 3 of them, and it would be beneficial to know which of the Web-based sources performs best in order to be considered to complement traditional methods.</p>
        
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>The objective of this study is to comparatively analyze Google, Twitter, and Wikipedia by examining which best corresponds with Centers for Disease Control and Prevention (CDC) ILI data. It was hypothesized that Wikipedia would best correspond with CDC ILI data as previous research found it to be least influenced by high media coverage in comparison with Google and Twitter.</p>
        
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>Publicly available, deidentified data were collected from the CDC, Google Flu Trends, HealthTweets, and Wikipedia for the 2012-2015 influenza seasons. Bayesian change point analysis was used to detect seasonal changes, or change points, in each of the data sources. Change points in Google, Twitter, and Wikipedia that occurred during the exact week, 1 preceding week, or 1 week after the CDC’s change points were compared with the CDC data as the gold standard. All analyses were conducted using the R package “bcp” version 4.0.0 in RStudio version 0.99.484 (RStudio Inc). In addition, sensitivity and positive predictive values (PPV) were calculated for Google, Twitter, and Wikipedia.</p>
        
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>During the 2012-2015 influenza seasons, a high sensitivity of 92% was found for Google, whereas the PPV for Google was 85%. A low sensitivity of 50% was calculated for Twitter; a low PPV of 43% was found for Twitter also. Wikipedia had the lowest sensitivity of 33% and lowest PPV of 40%.</p>
        
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Of the 3 Web-based sources, Google had the best combination of sensitivity and PPV in detecting Bayesian change points in influenza-related data streams. Findings demonstrated that change points in Google, Twitter, and Wikipedia data occasionally aligned well with change points captured in CDC ILI data, yet these sources did not detect all changes in CDC data and should be further studied and developed.</p>
        
      </sec>
    </abstract>
    <kwd-group>
      <kwd>Internet</kwd>
      <kwd>social media</kwd>
      <kwd>Bayes theorem</kwd>
      <kwd>public health surveillance</kwd>
      <kwd>influenza, human</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Although largely vaccine-preventable, influenza places a burden on the US health care system, causing 3000-50,000 deaths annually [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. As one of the many influenza surveillance systems, the Centers for Disease Control and Prevention (CDC) monitors influenza activity by calculating the number of outpatient visits for the syndrome of influenza-like illness (ILI) reported by partnering health care providers to the US Outpatient ILI Surveillance Network (ILINet). The CDC defines ILI as a fever (≥100°F or 37.8°C) and a cough and/or sore throat without a known cause other than influenza [<xref ref-type="bibr" rid="ref3">3</xref>]. This approach to surveillance primarily captures information about people who seek medical care for their influenza symptoms, thus missing those who do not interact with the health care system. In addition, this surveillance method is limited by relatively dated technology and by delays of up to 1 to 2 weeks between the occurrence of the illness event and the dissemination of surveillance information [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        
        <p>Syndromic surveillance, which can be defined as the monitoring of disease syndromes in or near real time for early detection of outbreaks, has incorporated the use of novel data sources such as emergency department records and prescription sales to enhance traditional surveillance systems [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Recently, nontraditional data sources, particularly those that are Web-based, have come into greater application for public health surveillance. This is especially evident as individuals who experience various symptoms may search the Web for health-related information and share their illness experiences using social media platforms before seeking medical care. The use of Web-based data sources such as search queries and social media has been termed digital epidemiology [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Digital epidemiology can be less expensive and timelier, and it can expand detection by increasing the range of health events that can be detected.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>As the number of Internet users has increased [<xref ref-type="bibr" rid="ref11">11</xref>], researchers have identified the use of Google, Twitter, and Wikipedia as novel surveillance approaches to complement traditional methods. Google Flu Trends, which monitors Google users’ searches for information related to influenza, has shown correlation with CDC influenza data, while delivering estimates 1 to 2 weeks ahead of CDC reports [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Although initially successful, the system has not been without its issues in more recent years. Google Flu Trends overestimated influenza activity during the 2012-2013 influenza season and underestimated it during the 2009 H1N1 influenza pandemic [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. One study found that both the original (2008) and revised (2009) algorithms for Google Flu Trends were not reliable on city, regional, and national scales, particularly in instances of varying intensity in influenza seasons and media coverage [<xref ref-type="bibr" rid="ref16">16</xref>]. Due to issues with its proprietary algorithm, Google Flu Trends was discontinued in August 2015 [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        
        <p>Influenza-related posts on Twitter, a social networking platform for disseminating short messages (tweets), have shown high correlation with reported ILI activity in ILINet [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Studies have found that Twitter data highly correlate with national- and city-level ILI counts [<xref ref-type="bibr" rid="ref20">20</xref>]. Signorini et al (2011) also demonstrated that tweets could be used to estimate ILI activity at regional and national levels within a reasonable margin of error [<xref ref-type="bibr" rid="ref21">21</xref>]. Moreover, studies have found that Twitter data perform better than Google data. Nagar et al (2014) conducted a study showing that tweets better reflected city-level ILI incidence in comparison with Google search queries [<xref ref-type="bibr" rid="ref22">22</xref>]. Aramaki et al discovered that a Twitter-based model outperformed a Google-based model during periods of normal news coverage, although the Twitter model performed less optimally during the periods of excessive media coverage [<xref ref-type="bibr" rid="ref23">23</xref>]. Moreover, geographic granularity can affect the performance of Twitter data. Broniatowski et al (2015) found that city-level Twitter data performed better than state- and national-level Twitter data, although Google Flu Trends data performed better at each level [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        
        <p>Wikipedia page view data have proven valuable for tracking trending topics as well as disease monitoring and forecasting [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. McIver and Brownstein (2014) reported that increases in the quantity of visits to influenza-related Wikipedia articles allowed for the estimation of influenza activity up to 2 weeks before ILINet, outperforming Google Flu Trends estimates during abnormal influenza seasons and periods of high media reporting [<xref ref-type="bibr" rid="ref27">27</xref>]. One study found that Wikipedia page view data have suitable forecasting value up until the peak of the influenza seasons [<xref ref-type="bibr" rid="ref26">26</xref>], whereas another study also reported that Wikipedia page view data are suitable for forecasting using a 28-day analysis as well as for nowcasting, or monitoring current disease incidence [<xref ref-type="bibr" rid="ref25">25</xref>]. However, as a disadvantage, the signal-to-noise ratio of Wikipedia data can be problematic [<xref ref-type="bibr" rid="ref25">25</xref>] as Wikipedia has become a preferred source for seeking health information whether an individual is ill or not [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. In addition, unlike the granularity flexibility of Google and Twitter data, Wikipedia does not have such capability of evaluating influenza activity at local or regional levels because it only provides counts of page views and no accompanying location or user information in its publicly available data.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>These early studies on Google, Twitter, and Wikipedia show that, in spite of some drawbacks, mining these Web-based sources may provide valuable epidemic intelligence by identifying indicators of influenza activity at times or in populations that are missed by more traditional surveillance systems. Previous studies have evaluated these 3 Web-based sources individually or dually against a standard, but have not compared all 3 of them with each other and a standard. This comparison is needed to understand whether each of these Web-based sources accurately reflects seasonal changes, or change points, that occur in CDC ILI data. It would be beneficial to know which of these Web-based sources performs the best in order to be considered as a complement to traditional surveillance methods.</p>
        
        <p>Thus, this study aims to conduct a comparative analysis of using Google, Twitter, and Wikipedia for influenza surveillance by examining which Web-based source produces data that are most aligned with CDC ILI data. The specific research question is as follows: For which Web-based source—Google, Twitter, or Wikipedia—do detected change points most closely match change points detected in CDC ILI data for the 2012-2013, 2013-2014, and 2014-2015 influenza seasons? It is hypothesized that Wikipedia data will have the most change points in common with CDC ILI data due to McIver and Brownstein’s [<xref ref-type="bibr" rid="ref27">27</xref>] finding that Wikipedia data can be less influenced by media coverage in comparison with data from Google Flu Trends and Twitter [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <sec>
          <title>Study Period</title>
          <p>Data were retrospectively collected for the US-designated 2012-2013 influenza season (September 30, 2012 to May 18, 2013), 2013-2014 influenza season (September 29, 2013 to May 17, 2014), and 2014-2015 influenza season (September 28, 2014 to May 23, 2015) [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. This study period, that is 2012-2015, was chosen due to data constraints. The Twitter data from HealthTweets.org contained tweets dating back to November 2011. As we sought to analyze complete influenza seasons, we could not include the 2011-2012 influenza season or, therefore, any preceding seasons. In addition, we could not include data after the 2014-2015 influenza season because Google ceased making their Google Flu Trends data publicly available in August 2015.</p>
          
          <p>All data were presented as Morbidity and Mortality Weekly Report (MMWR) weeks. MMWR weeks start on Sunday and end on Saturday, ranging from 1 to 52 or 53 weeks [<xref ref-type="bibr" rid="ref33">33</xref>]. Each of the influenza seasons included in this study begins in MMWR week 40 of a year and ends in week 20 of the following year.</p>
          
        </sec>
        <sec>
          <title>CDC Data</title>
          <p>Data from the CDC ILINet system were downloaded from FluView Interactive, which provides weekly influenza surveillance information on outpatient illness, hospitalizations, pediatric mortality, virologic surveillance, and geographic activity [<xref ref-type="bibr" rid="ref34">34</xref>]. ILINet count data are aggregated by MMWR week. The ILINet system aggregates weekly information from participating health care providers on counts of patients seen for ILI by age group, total patients seen by age group, and corresponding year and week [<xref ref-type="bibr" rid="ref34">34</xref>]. Counts of ILI patient visits in the United States were used for this study. Although most prior studies used weighted ILI rates, we elected to use ILI counts. We decided to use CDC ILI count data to maintain unit comparison because we could not use the Bayesian change point analysis to transpose or model the Web-based count data to a similar scale as the CDC weighted ILI rates.</p>
          
        </sec>
        <sec>
          <title>Google Data</title>
          <p>Deidentified, national-level count data of influenza-related Google searches made in the United States were downloaded from the Google Flu Trends website [<xref ref-type="bibr" rid="ref17">17</xref>]. These data are the output of a CDC data-fitted regression model and are based on Google Flu Trends’ 2009 model (for the 2012-2013 influenza season), 2013 model (for the 2013-2014 influenza season), and 2014 model (for the 2014-2015 influenza season) [<xref ref-type="bibr" rid="ref17">17</xref>]. Count data from Google Flu Trends were already aggregated by MMWR week.</p>
          
        </sec>
        <sec>
          <title>Twitter Data</title>
          <p>For data from Twitter, deidentified, national-level count data of influenza-related tweets in the United States were downloaded from HealthTweets.org, a Johns Hopkins University-based repository of influenza-related tweets dating back to November 2011 [<xref ref-type="bibr" rid="ref35">35</xref>]. Using the Twitter application programming interface (API), the HealthTweets team collected influenza-related tweets from a keyword stream, which is 1% of public tweets [<xref ref-type="bibr" rid="ref35">35</xref>]. After collection, Dredze et al [<xref ref-type="bibr" rid="ref35">35</xref>] categorized the influenza-related tweets using automated annotators based on keywords, keyword combinations, and the classifier developed by Lamb and colleagues [<xref ref-type="bibr" rid="ref36">36</xref>]. Data from HealthTweets were also already aggregated by MMWR week.</p>
          
        </sec>
        <sec>
          <title>Wikipedia Data</title>
          <p>Wikipedia has made its article view data available for downloading through Wikimedia Statistics [<xref ref-type="bibr" rid="ref37">37</xref>]. Wikipedia article view data that are deidentified and aggregated were gathered for views on the “Influenza” article (English version). Count data from the English version of the “Influenza” article served as a proxy for US national-level Wikipedia views. Wikipedia data are presented as the number of article views by the hour, including nonunique views [<xref ref-type="bibr" rid="ref37">37</xref>]. As Wikipedia article view data on the “Influenza” article are presented by the hour in Wikimedia Statistics, the data were aggregated by MMWR week before analysis.</p>
          
        </sec>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <sec>
          <title>Bayesian Change Point Analysis</title>
          <p>Bayesian change point analysis was the method used for this study. In essence, this technique detects inflections that signal a change within time series data, also known as change points. Bayesian change point analysis has been primarily used to detect when significant changes occur within datasets that have big data properties, such as volume, variety, and velocity [<xref ref-type="bibr" rid="ref38">38</xref>]. For instance, Bayesian change point analysis has been used to estimate when changes occurred in interest rate data [<xref ref-type="bibr" rid="ref39">39</xref>], chromosomal microarray data [<xref ref-type="bibr" rid="ref39">39</xref>], and cancer-related gene expression data [<xref ref-type="bibr" rid="ref40">40</xref>]. This method was used to detect changes in emergency department attendance and hospital admissions after a health system transformation in a post-earthquake area [<xref ref-type="bibr" rid="ref41">41</xref>]. Bayesian change point analysis has also been used to detect changes in the dynamics of an aquatic ecosystem such as the introduction of a nonnative species [<xref ref-type="bibr" rid="ref42">42</xref>]. Besides our study, this Bayesian technique has been used only once for influenza surveillance using ILI visits to emergency departments [<xref ref-type="bibr" rid="ref43">43</xref>], which is unlike our analysis in that we used Web-based data.</p><fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Simplified equation by Barry and Hartigan.</p>
            </caption>
            <graphic xlink:href="publichealth_v2i2e161_fig1.PNG" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          
          <p>Bayesian change point analysis was the method of choice as it is one of the proven methods that can detect subtle changes in time series data more effectively than traditional aberration detection methods [<xref ref-type="bibr" rid="ref43">43</xref>]. Kass-Hout et al (2012) found that Bayesian change point analysis was not as sensitive as 2 other change point analysis methods—the cumulative sum technique and structural change model [<xref ref-type="bibr" rid="ref43">43</xref>]. However, Bayesian change point analysis has been best applied to microarray data [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>], which have big data properties similar to Web-based data.</p>
          
          <p>All Bayesian change point analyses were conducted using the R package “bcp” version 4.0.0 [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] in RStudio version 0.99.484 [<xref ref-type="bibr" rid="ref45">45</xref>]. The “bcp” package implements a complex Markov Chain Monte Carlo (MCMC) approximation [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] of the Bayesian change point method described by Barry and Hartigan [<xref ref-type="bibr" rid="ref46">46</xref>]. As the default for the “bcp” package, after 500 MCMC iterations, the probability of a change point at any given interval (ie, MMWR week) in time series data is computed from the number of times in the MCMC iterations that the condition of having a change point at that interval was met [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>].</p>
          
          <p>In each step of the Markov chain, the transition probability, <italic>p</italic>, for the conditional probability of a change point is found from the simplified equation by Barry and Hartigan [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref46">46</xref>], which is provided in <xref ref-type="fig" rid="figure1">Figure 1</xref>. After each MCMC iteration, the posterior means and probabilities are updated until the end of the time series. It is recommended that readers refer to Erdman and Emerson (2007), Erdman and Emerson (2008), and Barry and Hartigan (1993) for further mathematical explanation of this Bayesian method [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref46">46</xref>].</p>
          
        </sec>
        <sec>
          <title>Change Points</title>
          <p>We considered significant change points to be where the Bayesian method indicated the probability of a change occurring as ≥50%. Change points detected in the CDC ILI data were the gold standard with which change points found in the Web-based sources were compared. Change points of the Web-based sources that occurred during the exact week, 1 preceding week, or 1 week after the CDC change points were considered matching or true change points. This was done to account for any reporting lags that can be common with surveillance data. The number of change points for each data source was compared, and sensitivity and PPV for the detection of change points were calculated for each of the Web-based sources.</p>
          
        </sec>
        <sec>
          <title>Sensitivity and Positive Predictive Values</title>
          <p>Sensitivity and PPV were computed for each Web-based source using the change points detected for that Web-based source that matched change points detected for the CDC ILINet system (true positives), change points detected for the ILINet system but not for the Web-based source (false negatives), and change points detected for the Web-based source but not for the ILINet system (false positives). Sensitivity was calculated by dividing the true positives for each Web-based source by the total of true positives and false negatives, which would be the total number of CDC change points [<xref ref-type="bibr" rid="ref47">47</xref>]. PPV were calculated by dividing the true positives for each Web-based source by the total of true positives and false positives, which would be the total change points for that particular Web-based source [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
          
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Sample Characteristics</title>
        <p>A summary of the count data that were collected and analyzed for the CDC, Google, Twitter, and Wikipedia for the 2012-2015 influenza seasons is provided (<xref ref-type="table" rid="table1">Table 1</xref>). There was year-to-year variability in the average weekly counts of events included for each of the data sources. For most of the data sources, the 2012-2013 influenza season had the highest average number of weekly counts. The 2013-2014 influenza season had the lowest average number for the CDC and Google Flu Trends, whereas the 2014-2015 influenza season had the lowest average number for Twitter and Wikipedia. Note that the 2014-2015 influenza season consisted of 34 total MMWR weeks: whereas most epidemiologic years comprise 52 MMWR weeks, the 2014-2015 epidemiologic year had 53 weeks due to a preceding calendar leap year. <xref ref-type="table" rid="table1">Table 1</xref> further summarizes the data information.</p>
        
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of weekly influenza-like illness count data for the Centers for Disease Control and Prevention, Google, Twitter, and Wikipedia, 2012-2015 influenza seasons.</p>
          </caption>
          <table width="631" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="10"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top"><td><break/></td>
                <td>Influenza season</td>
                <td>CDC<sup>a</sup> ILINet<sup>b</sup></td>
                <td>Google</td>
                <td>Twitter</td>
                <td>Wikipedia</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6"><bold>2012-2013</bold></td>

              </tr>
              <tr valign="top"><td><break/></td>
                <td>MMWR<sup>c</sup> Weeks (counts/week)</td>
                <td>33</td>
                <td>33</td>
                <td>33</td>
                <td>33</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Mean</td>
                <td>19,049</td>
                <td>4121</td>
                <td>8096</td>
                <td>47,541</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Min</td>
                <td>7317</td>
                <td>1286</td>
                <td>2558</td>
                <td>29,865</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Max</td>
                <td>39,896</td>
                <td>10,555</td>
                <td>22,935</td>
                <td>114,919</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>2013-2014</bold></td>

              </tr>
              <tr valign="top"><td><break/></td>
                <td>MMWR Weeks (counts/week)</td>
                <td>33</td>
                <td>33</td>
                <td>33</td>
                <td>33</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Mean</td>
                <td>16,574</td>
                <td>2274</td>
                <td>5826</td>
                <td>25,039</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Min</td>
                <td>9033</td>
                <td>1339</td>
                <td>1196</td>
                <td>17,885</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Max</td>
                <td>28,654</td>
                <td>5008</td>
                <td>10,506</td>
                <td>36,935</td>
              </tr>
              <tr valign="top">
                <td colspan="6"><bold>2014-2015</bold></td>

              </tr>
              <tr valign="top"><td><break/></td>
                <td>MMWR Weeks (counts/week)</td>
                <td>34</td>
                <td>34</td>
                <td>34</td>
                <td>34</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Mean</td>
                <td>19,940</td>
                <td>2549</td>
                <td>2900</td>
                <td>21,918</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Min</td>
                <td>9289</td>
                <td>1144</td>
                <td>451</td>
                <td>12,958</td>
              </tr>
              <tr valign="top"><td><break/></td>
                <td>Max</td>
                <td>40,664</td>
                <td>6911</td>
                <td>8709</td>
                <td>35,232</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>CDC: Centers for Disease Control and Prevention.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>ILINet: United States Outpatient Influenza-like Illness Surveillance Network.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>MMWR: Morbidity and Mortality Weekly Report.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparison of Change Points Detected in the 2012-2015 Influenza Seasons</title>
        <p>A summary of all change points found in each data source is provided (see <xref ref-type="fig" rid="figure2">Figures 2</xref>-<xref ref-type="fig" rid="figure4">4</xref>), and a comparison of change points is shown in <xref ref-type="table" rid="table2">Table 2</xref>. For the 2012-2013 influenza season, Google had 3 total change points in common with the CDC ILINet system, which were MMWR weeks 51, 4, and 5. Twitter had 2 change points in common with the CDC’s change points, which were MMWR weeks 47 and 4. Wikipedia had only 1 change point that matched the CDC ILINet system, which was MMWR week 5.</p>
        
        <p>In the 2013-2014 influenza season, Google had a total of 4 change points (MMWR weeks 48, 50, 51, and 5) that coincided with change points detected in the CDC data. Twitter had 3 change points (MMWR weeks 48, 51, and 7) that matched change points in the CDC ILINet system’s data. Wikipedia had 2 change points in common with CDC ILI data, which were MMWR weeks 51 and 6.</p>
        
        <p>For the 2014-2015 influenza season, 4 change points (MMWR weeks 48, 50, 51, and 53) were detected in the Google data that concurred with change points identified in the CDC ILINet system. Twitter and Wikipedia each had only 1 change point that coincided with the change points found in the CDC ILI data, which were MMWR weeks 50 and 53, respectively.</p>
        
        
      
      </sec>
      <sec>
        <title>Comparison of Sensitivity and Positive Predictive Value Detected Among Web-Based Sources</title>
        <p>Next, we computed the sensitivity and PPV for each of the Web-based sources using the CDC ILI data as the gold standard. As shown in <xref ref-type="table" rid="table3">Table 3</xref>, results varied widely across the Web-based sources. A high sensitivity of 92% was found for Google, while the PPV for Google was 85%. Twitter had a low sensitivity of 50% and a low PPV of 43%. Wikipedia had the lowest sensitivity of 33% and lowest PPV of 40%. A table comparing sensitivity and PPV by specific influenza season is also provided (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comparison of change points detected using Bayesian change point analysis, 2012-2015 influenza seasons<sup>a</sup>.</p>
          </caption>
          <table width="625" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="82"/>
            <col width="136"/>
            <col width="106"/>
            <col width="106"/>
            <col width="123"/>
            <thead>
              <tr valign="top">
                <td>Influenza season</td>
                <td>CDC<sup>b</sup> ILINet<sup>c</sup> counts (reference)</td>
                <td>Google counts</td>
                <td>Twitter counts</td>
                <td>Wikipedia counts</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td><bold>2012-2013</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 47<sup>a</sup></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 48</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 50</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 51<sup>a</sup></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 52</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 1</td>
                <td>Week 1</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 3</td>
                <td>Week 3</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 4<sup>a</sup></td>
                <td>Week 4<sup>a</sup></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 5</td>
                <td>Week 5<sup>a</sup></td>
                <td><break/></td>
                <td>Week 5<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td><bold>2013-2014</bold></td>
                <td>Week 48</td>
                <td>Week 48<sup>a</sup></td>
                <td>Week 48<sup>a</sup></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 50</td>
                <td>Week 50<sup>a</sup></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 51<sup>a</sup></td>
                <td>Week 51<sup>a</sup></td>
                <td>Week 51<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 1</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 3</td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 4</td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 5<sup>a</sup></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 6</td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 6<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 7<sup>a</sup></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 15</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 17</td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><bold>2014-2015</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 43</td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 44</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 48</td>
                <td>Week 48<sup>a</sup></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 49</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 50</td>
                <td>Week 50<sup>a</sup></td>
                <td>Week 50<sup>a</sup></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 51<sup>a</sup></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 53</td>
                <td>Week 53<sup>a</sup></td>
                <td><break/></td>
                <td>Week 53<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 2</td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 3</td>
                <td>Week 3</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td>Week 4</td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Week 6</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td>Week 12</td>
                <td><break/></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>MMWR week indicates a corresponding change point to the CDC change points (reference).</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>CDC: Centers for Disease Control and Prevention.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>ILINet: United States Outpatient Influenza-like Illness Surveillance Network.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        
        
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Change points (dotted lines) detected by Bayesian change point analysis, 2012-2013 influenza season.</p>
          </caption>
          <graphic xlink:href="publichealth_v2i2e161_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Change points (dotted lines) detected by Bayesian change point analysis, 2013-2014 influenza season.</p>
          </caption>
          <graphic xlink:href="publichealth_v2i2e161_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Change points (dotted lines) detected by Bayesian change point analysis, 2014-2015 influenza season.</p>
          </caption>
          <graphic xlink:href="publichealth_v2i2e161_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Comparison of sensitivity and positive predictive value among Web-based sources, 2012-2015 influenza seasons.</p>
          </caption>
          <table width="558" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="124"/>
            <col width="182"/>
            <col width="207"/>
            <thead>
              <tr valign="top">
                <td>Web-based source</td>
                <td>Sensitivity (%)</td>
                <td>Positive predictive value (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Google</td>
                <td>92</td>
                <td>85</td>
              </tr>
              <tr valign="top">
                <td>Twitter</td>
                <td>50</td>
                <td>43</td>
              </tr>
              <tr valign="top">
                <td>Wikipedia</td>
                <td>33</td>
                <td>40</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Google had a total of 11 true change points (3 in the 2012-2013 influenza season, 4 in the 2013-2014 influenza season, and 4 in the 2014-2015 influenza season) that coincided with the CDC ILINet’s change points. As Google had the most change points that coincided with change points detected in the CDC ILI data, our hypothesis that Wikipedia would have the most change points was not supported. Sensitivity and PPV for event detection are important for evaluating the quality of surveillance systems [<xref ref-type="bibr" rid="ref47">47</xref>]. Google had a moderate positive predictive value and was highly sensitive, whereas Twitter and Wikipedia both had low sensitivity rates and PPVs. This finding that Google had the best correspondence is not consistent with that of the previous studies that have found Twitter and Wikipedia to perform better [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        
        <p>Google, Twitter, and Wikipedia all had some change points that aligned well with CDC ILI data; however, they did not identify all change points that were identified in the CDC data, which would be important for understanding when seasonal changes occur during an influenza season. As no Web-based source identified all detected changes in the CDC data, this could indicate that the Web-based data themselves may be limited in capturing all changes in CDC ILI data, which is quite plausible as not every individual who experiences ILI symptoms resorts to searching or sharing health information online. Alternatively, this could indicate that Bayesian change point analysis as a technique is not adequately sensitive for use on Web-based data. These 3 Web-based sources need to be further studied and compared using more standard statistical methods before being incorporated as surveillance data to complement a traditional system.</p>
        
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are limitations of this study that should be noted. First, Bayesian change point analysis assumes time series data are distributed normally, which can be problematic as public health surveillance data can be variable and can have a nonnormal distribution [<xref ref-type="bibr" rid="ref43">43</xref>]. However, we were unable to test this assumption on the “bcp” package in RStudio, and this is a limitation because the “bcp” package could have incorrectly identified or missed change points, especially if there were any outliers in the data to skew the Bayesian analysis. Another major limitation to using Bayesian change point analysis is that it cannot be used as a technique to monitor real-time data [<xref ref-type="bibr" rid="ref49">49</xref>]. Bayesian change point analysis is best used to evaluate changes in historical time series data after all data have been collected. For this study, the Bayesian method was used to retrospectively evaluate data collected from the CDC, Google, Twitter, and Wikipedia after each influenza season occurred; therefore, the results cannot be directly applied for prospective use or real-time influenza surveillance.</p>
        
        <p>A possible solution to conducting real-time influenza surveillance using Web-based data may lie in using a normal distribution algorithm. Normal distribution methods that are based on historical limits and cumulative sums have been traditionally used for influenza surveillance by the CDC [<xref ref-type="bibr" rid="ref50">50</xref>]. However, Pervaiz et al (2012) demonstrated that real-time influenza surveillance using Web-based data could be done more effectively using negative binomial- and Poisson-based models as opposed to normal distribution models due to the noisy nature of Web-based data and fluctuating numbers of Internet users and their activity levels [<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        
        <p>Second, for the analysis of Wikipedia views, only the “Influenza” article was used for analysis, excluding other articles on influenza medications and influenza strains. McIver and Brownstein described the effectiveness of combining multiple influenza-related Wikipedia articles for surveillance purposes [<xref ref-type="bibr" rid="ref27">27</xref>], but those were not included in this study. We assumed all views of the English-language Wikipedia “Influenza” article were by US users; however, some may have come from users in other English-speaking countries where the influenza season is very different, such as Australia.</p>
        
        <p>Third, some of our data sources may have limits. We used CDC ILI count data for the analysis, which is not standard. Most prior studies have used weighted ILI rates instead of ILI counts because the weighted rates account for population variations in the United States. Using ILI counts may have sampling biases, but we justify the use of counts because we wanted to maintain data uniformity as none of the Web-based count data accounted for or could be normalized by population and regional variations in the United States. In addition, the Bayesian change point analysis did not allow us to transpose Web-based count data onto the same scale as weighted ILI rates; thus, ILI counts were the best option, considering the method used. Furthermore, the Google Flu Trends data used in this study were the output of a regression model that was fitted to CDC ILI data, leading to the Google data being a closer comparison with CDC ILI data. Although the Google Flu Trends data were fitted to match CDC data, it is important to note that these were readily available to the public as well as practitioners, justifying their use.</p>
        
        <p>Fourth, data duplication could be an issue with each data source used in this study. Internet users can use a single website for multiple information searches and shares, and a single Internet user can use multiple websites for the same information search or share [<xref ref-type="bibr" rid="ref51">51</xref>]. For example, a user can view the Wikipedia “Influenza” article multiple times and each view would be considered as a separate count [<xref ref-type="bibr" rid="ref37">37</xref>]. Neither Google Flu Trends nor HealthTweets can distinguish or remove multiple searches and tweets by a single user [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. In addition, there is no way, in publicly available data, to distinguish when a single user searches both Wikipedia and Google for the same information. The CDC ILINet system does not differentiate when a single patient makes repeated outpatient visits to the same participating health care provider or when a single patient makes outpatient visits to multiple health care providers for the same illness. This issue of data duplication should be further investigated in future studies.</p>
        
        <p>Finally, Internet users are, on average, younger than the general US population [<xref ref-type="bibr" rid="ref52">52</xref>]. Although this difference may be viewed as a limitation to using Web-based data for influenza surveillance, younger age groups (0-4 years, 5-24 years, and 25-49 years) account for a majority of the outpatient ILI counts that are reported to the CDC ILINet system [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        
      </sec>
      <sec>
        <title>Future Research</title>
        <p>There is more substantive information in the content of Web-based sources that is not accounted for in count data of Web-based sources. Recent research has already begun to conduct content analyses of Web-based sources such as chat forums, Facebook, and Twitter in order to understand the health experiences and needs addressed by Internet users. Content analyses have proven valuable for both communicable and noncommunicable diseases because Internet users share and search about various health experiences ranging from mental health [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>] to substance use [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref56">56</xref>] to the health needs of sexual minorities [<xref ref-type="bibr" rid="ref57">57</xref>]. In addition, public health surveillance can be strengthened by combining various data sources, whether Web-based or traditional. Santillana et al (2015) found that when data from Google, Twitter, hospital records, and a participatory surveillance system were combined, influenza activity was predicted more accurately than, and up to 4 weeks before, the CDC [<xref ref-type="bibr" rid="ref58">58</xref>]. More research should be carried out in this area to identify the best combination of traditional and novel data sources for influenza surveillance.</p>
        
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>To our knowledge, this is the first comparison to evaluate Google, Twitter, and Wikipedia as possible data sources for influenza surveillance against a common gold standard (the CDC ILINet system). Of the 3 Web-based sources, Google had the best combination of sensitivity and PPV in detecting Bayesian change points in influenza-related data streams. This finding is not consistent with existing research that has compared Google and Twitter data or Google and Wikipedia data, which could be attributed to the analysis of different influenza seasons, the novel use of the Bayesian method in this study, or the fact that Google Flu Trends data were fitted to CDC data. Further research should assess the substantive health content contained within these 3 Web-based sources, the surveillance value of combining these sources, and the ability of these sources to detect influenza activity using other statistical methods.</p>
        
        
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Comparison of sensitivity and positive predictive value (PPV) among Web-based sources by specific influenza season.</p>
        <media xlink:href="publichealth_v2i2e161_app1.pdf" xlink:title="PDF File (Adobe PDF File), 105KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CDC</term>
          <def>
            <p>Centers for Disease Control and Prevention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ILI</term>
          <def>
            <p>influenza-like illness</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ILINet</term>
          <def>
            <p>United States Outpatient Influenza-like Illness Surveillance Network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MCMC</term>
          <def>
            <p>Markov Chain Monte Carlo</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MMWR</term>
          <def>
            <p>Morbidity and Mortality Weekly Report</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank Dr. Heather Rubino (Florida Department of Health), Sophie Smith (Centers for Disease Control and Prevention), and Matthew Biggerstaff (Centers for Disease Control and Prevention) for their insight and expertise with understanding current influenza surveillance systems. We also acknowledge Dr. John Emerson (Yale University), Dr. Chandra Erdman (Management Leadership for Tomorrow), and Dr. Xiaofei Wang (Amherst College) for their assistance with understanding the R package “bcp” version 4.0.0. Finally, we extend special appreciation to Google Inc, Dr. Mark Dredze and his team at HealthTweets.org, and Wikimedia Statistics for making their data publicly accessible.</p>
      
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>JDS conceptualized and designed the study. RLC, RSH, and CWS provided feedback for the study design. JDS acquired data and performed the statistical analysis. JDS, RLC, RSH, and CWS contributed to the interpretation of findings. JDS drafted and revised the manuscript according to feedback provided by RLC, RSH, and CWS. All authors approved the final version of the manuscript.</p>
        
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
        
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chunara</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Goldstein</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Patterson-Lomba</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>Estimating influenza attack rates in the United States using a participatory cohort</article-title>
        <source>Sci Rep</source>  
        <year>2015</year>  
        <volume>5</volume>  
        <fpage>9540</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/srep09540"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/srep09540</pub-id>
        <pub-id pub-id-type="medline">25835538</pub-id>
        <pub-id pub-id-type="pii">srep09540</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <collab>Centers for Disease Control and Prevention</collab>
        </person-group>
        <article-title>Estimates of deaths associated with seasonal influenza — United States, 1976-2007</article-title>
        <source>MMWR Morb Mortal Wkly Rep</source>  
        <year>2010</year>  
        <volume>59</volume>  
        <issue>33</issue>  
        <fpage>1057</fpage>  
        <lpage>1062</lpage>  
        <pub-id pub-id-type="medline">20798667</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <year>2015</year>  
        <access-date>2016-03-26</access-date>
        <comment>Overview of influenza surveillance in the United States
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/flu/weekly/overview.htm">http://www.cdc.gov/flu/weekly/overview.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHxdKs79"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>De Silva</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Segre</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Eliciting disease data from Wikipedia articles</article-title>
        <year>2015</year>  
        <conf-name>Ninth International AAAI Conference on Web and Social Media</conf-name>
        <conf-date>2015</conf-date>
        <conf-loc>Oxford, England</conf-loc>
        <fpage>26</fpage>  
        <lpage>33</lpage> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Buehler</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Hopkins</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Overhage</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Sosin</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Tong</surname>
            <given-names>V</given-names>
          </name>
        </person-group>
        <article-title>Framework for evaluating public health surveillance systems for early detection of outbreaks: recommendations from the CDC Working Group</article-title>
        <source>MMWR Recomm Rep</source>  
        <year>2004</year>  
        <month>05</month>  
        <day>7</day>  
        <volume>53</volume>  
        <issue>RR-5</issue>  
        <fpage>1</fpage>  
        <lpage>11</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/mmwr/preview/mmwrhtml/rr5305a1.htm"/>
        </comment>  
        <pub-id pub-id-type="medline">15129191</pub-id>
        <pub-id pub-id-type="pii">rr5305a1</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Buehler</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Sonricker</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Paladini</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Soper</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Mostashari</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Syndromic surveillance practice in the United States: findings from a survey of state, territorial, and selected local health departments</article-title>
        <source>Adv Dis Surveill</source>  
        <year>2008</year>  
        <volume>6</volume>  
        <issue>3</issue>  
        <fpage>1</fpage>  
        <lpage>20</lpage> </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Henning</surname>
            <given-names>KJ</given-names>
          </name>
        </person-group>
        <article-title>What is syndromic surveillance?</article-title>
        <source>MMWR Suppl</source>  
        <year>2004</year>  
        <month>09</month>  
        <day>24</day>  
        <volume>53</volume>  
        <fpage>5</fpage>  
        <lpage>11</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/mmwr/preview/mmwrhtml/su5301a3.htm"/>
        </comment>  
        <pub-id pub-id-type="medline">15714620</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bernardo</surname>
            <given-names>TM</given-names>
          </name>
          <name name-style="western">
            <surname>Rajic</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Robiadek</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pham</surname>
            <given-names>MT</given-names>
          </name>
          <name name-style="western">
            <surname>Funk</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Scoping review on search queries and social media for disease surveillance: a chronology of innovation</article-title>
        <source>J Med Internet Res</source>  
        <year>2013</year>  
        <volume>15</volume>  
        <issue>7</issue>  
        <fpage>e147</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/7/e147/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2740</pub-id>
        <pub-id pub-id-type="medline">23896182</pub-id>
        <pub-id pub-id-type="pii">v15i7e147</pub-id>
        <pub-id pub-id-type="pmcid">PMC3785982</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
        <source>J Med Internet Res</source>  
        <year>2009</year>  
        <volume>11</volume>  
        <issue>1</issue>  
        <fpage>e11</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2009/1/e11/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
        <pub-id pub-id-type="medline">19329408</pub-id>
        <pub-id pub-id-type="pii">v11i1e11</pub-id>
        <pub-id pub-id-type="pmcid">PMC2762766</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salathé</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bengtsson</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Bodnar</surname>
            <given-names>TJ</given-names>
          </name>
          <name name-style="western">
            <surname>Brewer</surname>
            <given-names>DD</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Buckee</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Campbell</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Cattuto</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Khandelwal</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mabry</surname>
            <given-names>PL</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Digital epidemiology</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2012</year>  
        <volume>8</volume>  
        <issue>7</issue>  
        <fpage>e1002616</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1002616"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002616</pub-id>
        <pub-id pub-id-type="medline">22844241</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-12-00494</pub-id>
        <pub-id pub-id-type="pmcid">PMC3406005</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
        <source>International Telecommunication Union</source>  
        <access-date>2016-03-26</access-date>
        <comment>ICT facts and figures: the world in 2015
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.itu.int/en/ITU-D/Statistics/Documents/facts/ICTFactsFigures2015.pdf">http://www.itu.int/en/ITU-D/Statistics/Documents/facts/ICTFactsFigures2015.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHxY2tQX"/></comment> </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ginsberg</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Mohebbi</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Patel</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Brammer</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Smolinski</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Brilliant</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Detecting influenza epidemics using search engine query data</article-title>
        <source>Nature</source>  
        <year>2009</year>  
        <month>02</month>  
        <day>19</day>  
        <volume>457</volume>  
        <issue>7232</issue>  
        <fpage>1012</fpage>  
        <lpage>1014</lpage>  
        <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
        <pub-id pub-id-type="medline">19020500</pub-id>
        <pub-id pub-id-type="pii">nature07634</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Conrad</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Fowlkes</surname>
            <given-names>AL</given-names>
          </name>
          <name name-style="western">
            <surname>Mohebbi</surname>
            <given-names>MH</given-names>
          </name>
        </person-group>
        <article-title>Assessing Google flu trends performance in the United States during the 2009 influenza virus A (H1N1) pandemic</article-title>
        <source>PLoS One</source>  
        <year>2011</year>  
        <volume>6</volume>  
        <issue>8</issue>  
        <fpage>e23610</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0023610"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0023610</pub-id>
        <pub-id pub-id-type="medline">21886802</pub-id>
        <pub-id pub-id-type="pii">PONE-D-11-06712</pub-id>
        <pub-id pub-id-type="pmcid">PMC3158788</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Butler</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>When Google got flu wrong</article-title>
        <source>Nature</source>  
        <year>2013</year>  
        <month>02</month>  
        <day>14</day>  
        <volume>494</volume>  
        <issue>7436</issue>  
        <fpage>155</fpage>  
        <lpage>156</lpage>  
        <pub-id pub-id-type="doi">10.1038/494155a</pub-id>
        <pub-id pub-id-type="medline">23407515</pub-id>
        <pub-id pub-id-type="pii">494155a</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lazer</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Kennedy</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>King</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Big data. The parable of Google Flu: traps in big data analysis</article-title>
        <source>Science</source>  
        <year>2014</year>  
        <month>03</month>  
        <day>14</day>  
        <volume>343</volume>  
        <issue>6176</issue>  
        <fpage>1203</fpage>  
        <lpage>1205</lpage>  
        <pub-id pub-id-type="doi">10.1126/science.1248506</pub-id>
        <pub-id pub-id-type="medline">24626916</pub-id>
        <pub-id pub-id-type="pii">343/6176/1203</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Olson</surname>
            <given-names>DR</given-names>
          </name>
          <name name-style="western">
            <surname>Konty</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Paladini</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Viboud</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Simonsen</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Reassessing Google Flu Trends data for detection of seasonal and pandemic influenza: a comparative epidemiological study at three geographic scales</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2013</year>  
        <volume>9</volume>  
        <issue>10</issue>  
        <fpage>e1003256</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003256"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003256</pub-id>
        <pub-id pub-id-type="medline">24146603</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-13-00957</pub-id>
        <pub-id pub-id-type="pmcid">PMC3798275</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
        <source>Google</source>  
        <access-date>2016-03-26</access-date>
        <comment>Google Flu Trends
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.google.org/flutrends/about/">http://www.google.org/flutrends/about/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHx8E3SD"/></comment> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Twitter: big data opportunities</article-title>
        <source>Science</source>  
        <year>2014</year>  
        <month>07</month>  
        <day>11</day>  
        <volume>345</volume>  
        <issue>6193</issue>  
        <fpage>148</fpage>  
        <pub-id pub-id-type="doi">10.1126/science.345.6193.148-a</pub-id>
        <pub-id pub-id-type="medline">25013052</pub-id>
        <pub-id pub-id-type="pii">345/6193/148-a</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aslam</surname>
            <given-names>AA</given-names>
          </name>
          <name name-style="western">
            <surname>Tsou</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Spitzberg</surname>
            <given-names>BH</given-names>
          </name>
          <name name-style="western">
            <surname>An</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Gawron</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Gupta</surname>
            <given-names>DK</given-names>
          </name>
          <name name-style="western">
            <surname>Peddecord</surname>
            <given-names>KM</given-names>
          </name>
          <name name-style="western">
            <surname>Nagel</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Allen</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lindsay</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>The reliability of tweets as a supplementary method of seasonal influenza surveillance</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <volume>16</volume>  
        <issue>11</issue>  
        <fpage>e250</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/11/e250/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3532</pub-id>
        <pub-id pub-id-type="medline">25406040</pub-id>
        <pub-id pub-id-type="pii">v16i11e250</pub-id>
        <pub-id pub-id-type="pmcid">PMC4260066</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic</article-title>
        <source>PLoS One</source>  
        <year>2013</year>  
        <volume>8</volume>  
        <issue>12</issue>  
        <fpage>e83672</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0083672"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0083672</pub-id>
        <pub-id pub-id-type="medline">24349542</pub-id>
        <pub-id pub-id-type="pii">PONE-D-13-35058</pub-id>
        <pub-id pub-id-type="pmcid">PMC3857320</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Signorini</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Segre</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Polgreen</surname>
            <given-names>PM</given-names>
          </name>
        </person-group>
        <article-title>The use of Twitter to track levels of disease activity and public concern in the U.S. during the influenza A H1N1 pandemic</article-title>
        <source>PLoS One</source>  
        <year>2011</year>  
        <volume>6</volume>  
        <issue>5</issue>  
        <fpage>e19467</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0019467"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0019467</pub-id>
        <pub-id pub-id-type="medline">21573238</pub-id>
        <pub-id pub-id-type="pii">PONE-D-10-02464</pub-id>
        <pub-id pub-id-type="pmcid">PMC3087759</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nagar</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Yuan</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Freifeld</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Nojima</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Chunara</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>A case study of the New York City 2012-2013 influenza season with daily geocoded Twitter data from temporal and spatiotemporal perspectives</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <volume>16</volume>  
        <issue>10</issue>  
        <fpage>e236</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/10/e236/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3416</pub-id>
        <pub-id pub-id-type="medline">25331122</pub-id>
        <pub-id pub-id-type="pii">v16i10e236</pub-id>
        <pub-id pub-id-type="pmcid">PMC4259880</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Maskawa</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Twitter catches the flu: detecting influenza epidemics using Twitter</article-title>
        <year>2011</year>  
        <conf-name>Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
        <conf-date>2011</conf-date>
        <conf-loc>Edinburgh, Scotland</conf-loc>
        <fpage>1568</fpage>  
        <lpage>1576</lpage> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dugas</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Using Social Media to Perform Local Influenza Surveillance in an Inner-City Hospital: A Retrospective Observational Study</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2015</year>  
        <volume>1</volume>  
        <issue>1</issue>  
        <fpage>e5</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2015/1/e5/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.4472</pub-id>
        <pub-id pub-id-type="medline">27014744</pub-id>
        <pub-id pub-id-type="pmcid">PMC4803078</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Generous</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Deshpande</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>SY</given-names>
          </name>
          <name name-style="western">
            <surname>Priedhorsky</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Global disease monitoring and forecasting with Wikipedia</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2014</year>  
        <month>11</month>  
        <volume>10</volume>  
        <issue>11</issue>  
        <fpage>e1003892</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003892"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003892</pub-id>
        <pub-id pub-id-type="medline">25392913</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-14-00678</pub-id>
        <pub-id pub-id-type="pmcid">PMC4231164</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hickmann</surname>
            <given-names>KS</given-names>
          </name>
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Priedhorsky</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Generous</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Hyman</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Deshpande</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>SY</given-names>
          </name>
        </person-group>
        <article-title>Forecasting the 2013-2014 influenza season using Wikipedia</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>11</volume>  
        <issue>5</issue>  
        <fpage>e1004239</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1004239"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004239</pub-id>
        <pub-id pub-id-type="medline">25974758</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-14-01771</pub-id>
        <pub-id pub-id-type="pmcid">PMC4431683</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>McIver</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>Wikipedia usage estimates prevalence of influenza-like illness in the United States in near real-time</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2014</year>  
        <month>04</month>  
        <volume>10</volume>  
        <issue>4</issue>  
        <fpage>e1003581</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003581"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003581</pub-id>
        <pub-id pub-id-type="medline">24743682</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-13-02242</pub-id>
        <pub-id pub-id-type="pmcid">PMC3990502</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Laurent</surname>
            <given-names>MR</given-names>
          </name>
          <name name-style="western">
            <surname>Vickers</surname>
            <given-names>TJ</given-names>
          </name>
        </person-group>
        <article-title>Seeking health information online: does Wikipedia matter?</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2009</year>  
        <volume>16</volume>  
        <issue>4</issue>  
        <fpage>471</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=19390105"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1197/jamia.M3059</pub-id>
        <pub-id pub-id-type="medline">19390105</pub-id>
        <pub-id pub-id-type="pii">M3059</pub-id>
        <pub-id pub-id-type="pmcid">PMC2705249</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tausczik</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Faasse</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pennebaker</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Petrie</surname>
            <given-names>KJ</given-names>
          </name>
        </person-group>
        <article-title>Public anxiety and information seeking following the H1N1 outbreak: blogs, newspaper articles, and Wikipedia visits</article-title>
        <source>Health Commun</source>  
        <year>2012</year>  
        <volume>27</volume>  
        <issue>2</issue>  
        <fpage>179</fpage>  
        <lpage>85</lpage>  
        <pub-id pub-id-type="doi">10.1080/10410236.2011.571759</pub-id>
        <pub-id pub-id-type="medline">21827326</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <collab>Centers for Disease Control and Prevention</collab>
        </person-group>
        <article-title>Influenza activity - United States, 2012-2013 season and composition of the 2013-14 influenza vaccine</article-title>
        <source>MMWR Morb Mortal Wkly Rep</source>  
        <year>2013</year>  
        <volume>62</volume>  
        <issue>23</issue>  
        <fpage>473</fpage>  
        <lpage>479</lpage>  
        <pub-id pub-id-type="medline">23760189</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Epperson</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Blanton</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Kniss</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Mustaquim</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Steffens</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Wallis</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Dhara</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Leon</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Perez</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Chaves</surname>
            <given-names>SS</given-names>
          </name>
          <name name-style="western">
            <surname>Elal</surname>
            <given-names>AA</given-names>
          </name>
          <name name-style="western">
            <surname>Gubareva</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Villanueva</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Bresee</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cox</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Finelli</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Brammer</surname>
            <given-names>L</given-names>
          </name>
          <collab>Influenza Division, National Center for Immunization and Respiratory Diseases, CDC</collab>
        </person-group>
        <article-title>Influenza activity - United States, 2013-14 season and composition of the 2014-15 influenza vaccines</article-title>
        <source>MMWR Morb Mortal Wkly Rep</source>  
        <year>2014</year>  
        <month>06</month>  
        <day>6</day>  
        <volume>63</volume>  
        <issue>22</issue>  
        <fpage>483</fpage>  
        <lpage>90</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.cdc.gov/mmwr/preview/mmwrhtml/mm6322a2.htm"/>
        </comment>  
        <pub-id pub-id-type="medline">24898165</pub-id>
        <pub-id pub-id-type="pii">mm6322a2</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Appiah</surname>
            <given-names>GD</given-names>
          </name>
          <name name-style="western">
            <surname>Blanton</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>D'Mello</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Kniss</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mustaquim</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Steffens</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Dhara</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Cohen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chaves</surname>
            <given-names>SS</given-names>
          </name>
          <name name-style="western">
            <surname>Bresee</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wallis</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Abd Elal</surname>
            <given-names>AI</given-names>
          </name>
          <name name-style="western">
            <surname>Gubareva</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Wentworth</surname>
            <given-names>DE</given-names>
          </name>
          <name name-style="western">
            <surname>Katz</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Jernigan</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Brammer</surname>
            <given-names>L</given-names>
          </name>
          <collab>Centers for Disease Control and Prevention (CDC)</collab>
        </person-group>
        <article-title>Influenza activity - United States, 2014-15 season and composition of the 2015-16 influenza vaccine</article-title>
        <source>MMWR Morb Mortal Wkly Rep</source>  
        <year>2015</year>  
        <month>06</month>  
        <day>5</day>  
        <volume>64</volume>  
        <issue>21</issue>  
        <fpage>583</fpage>  
        <lpage>90</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.cdc.gov/mmwr/preview/mmwrhtml/mm6421a5.htm"/>
        </comment>  
        <pub-id pub-id-type="medline">26042650</pub-id>
        <pub-id pub-id-type="pii">mm6421a5</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <access-date>2016-03-26</access-date>
        <comment>MMWR weeks
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://wwwn.cdc.gov:443/nndss/document/MMWR_Week_overview.pdf">https://wwwn.cdc.gov:443/nndss/document/MMWR_Week_overview.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHxPOqx0"/></comment> </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <access-date>2016-03-26</access-date>
        <comment>FluView Interactive
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://gis.cdc.gov/grasp/fluview/fluportaldashboard.html">http://gis.cdc.gov/grasp/fluview/fluportaldashboard.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHxKR4m4"/></comment> </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>HealthTweets.org: a platform for public health surveillance using Twitter</article-title>
        <year>2014</year>  
        <conf-name>Twenty-Eighth AAAI Conference on Artificial Intelligence</conf-name>
        <conf-date>2014</conf-date>
        <conf-loc>Quebec City, Quebec, Canada</conf-loc></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lamb</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Separating fact from fear: tracking flu infections on Twitter</article-title>
        <source>Proceedings of the 2013 Conference of the North American Chapter of the Association for Computational Linguistics (NAACL): Human Language Technologies</source>  
        <year>2013</year>  
        <conf-name>Conference of the North American Chapter of the Association for Computational Linguistics (NAACL): Human Language Technologies</conf-name>
        <conf-date>2013</conf-date>
        <conf-loc>Atlanta, GA</conf-loc>
        <fpage>789</fpage>  
        <lpage>795</lpage> </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
        <source>Wikimedia</source>  
        <access-date>2016-03-26</access-date>
        <comment>Page view statistics for Wikimedia projects
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dumps.wikimedia.org/other/pagecounts-raw/">http://dumps.wikimedia.org/other/pagecounts-raw/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHwztskJ"/></comment> </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>De Mauro</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Greco</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Grimaldi</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>What is big data? A consensual definition and a review of key research topics</article-title>
        <source>Proceedings of AIP Conference</source>  
        <year>2015</year>  
        <conf-name>4th International Conference on Integrated Information</conf-name>
        <conf-date>September 5-8, 2014</conf-date>
        <conf-loc>Madrid, Spain</conf-loc>
        <publisher-name>AIP Publishing LLC</publisher-name>
        <fpage>97</fpage>  
        <lpage>104</lpage>  
        <pub-id pub-id-type="doi">10.1063/1.4907823</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Erdman</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Emerson</surname>
            <given-names>JW</given-names>
          </name>
        </person-group>
        <article-title>bcp: an R package for performing a Bayesian analysis of change point problems</article-title>
        <source>J Stat Softw</source>
        <year>2007</year>  
        <volume>23</volume>  
        <issue>3</issue>  
        <pub-id pub-id-type="doi">10.18637/jss.v023.i03</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Erdman</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Emerson</surname>
            <given-names>JW</given-names>
          </name>
        </person-group>
        <article-title>A fast Bayesian change point analysis for the segmentation of microarray data</article-title>
        <source>Bioinformatics</source>  
        <year>2008</year>  
        <month>10</month>  
        <day>1</day>  
        <volume>24</volume>  
        <issue>19</issue>  
        <fpage>2143</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bioinformatics.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=18667443"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/bioinformatics/btn404</pub-id>
        <pub-id pub-id-type="medline">18667443</pub-id>
        <pub-id pub-id-type="pii">btn404</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Schluter</surname>
            <given-names>PJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hamilton</surname>
            <given-names>GJ</given-names>
          </name>
          <name name-style="western">
            <surname>Deely</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Ardagh</surname>
            <given-names>MW</given-names>
          </name>
        </person-group>
        <article-title>Impact of integrated health system changes, accelerated due to an earthquake, on emergency department attendances and acute admissions: a Bayesian change-point analysis</article-title>
        <source>BMJ Open</source>  
        <year>2016</year>  
        <volume>6</volume>  
        <issue>5</issue>  
        <fpage>e010709</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&#38;pmid=27169741"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmjopen-2015-010709</pub-id>
        <pub-id pub-id-type="medline">27169741</pub-id>
        <pub-id pub-id-type="pii">bmjopen-2015-010709</pub-id>
        <pub-id pub-id-type="pmcid">PMC4874100</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ellis</surname>
            <given-names>BK</given-names>
          </name>
          <name name-style="western">
            <surname>Stanford</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Goodman</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Stafford</surname>
            <given-names>CP</given-names>
          </name>
          <name name-style="western">
            <surname>Gustafson</surname>
            <given-names>DL</given-names>
          </name>
          <name name-style="western">
            <surname>Beauchamp</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Chess</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Craft</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Deleray</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Hansen</surname>
            <given-names>BS</given-names>
          </name>
        </person-group>
        <article-title>Long-term effects of a trophic cascade in a large lake ecosystem</article-title>
        <source>Proc Natl Acad Sci U S A</source>  
        <year>2011</year>  
        <month>01</month>  
        <day>18</day>  
        <volume>108</volume>  
        <issue>3</issue>  
        <fpage>1070</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=21199944"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1073/pnas.1013006108</pub-id>
        <pub-id pub-id-type="medline">21199944</pub-id>
        <pub-id pub-id-type="pii">1013006108</pub-id>
        <pub-id pub-id-type="pmcid">PMC3024674</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kass-Hout</surname>
            <given-names>TA</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>McMurray</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Park</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Buckeridge</surname>
            <given-names>DL</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Finelli</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Groseclose</surname>
            <given-names>SL</given-names>
          </name>
        </person-group>
        <article-title>Application of change point analysis to daily influenza-like illness emergency department visits</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2012</year>  
        <volume>19</volume>  
        <issue>6</issue>  
        <fpage>1075</fpage>  
        <lpage>81</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=22759619"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000793</pub-id>
        <pub-id pub-id-type="medline">22759619</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2011-000793</pub-id>
        <pub-id pub-id-type="pmcid">PMC3534458</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Emerson</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>arXiv</source>
        <year>2015</year>  
        <access-date>2016-10-17</access-date>
        <comment>Bayesian change point analysis of linear models on general graphs
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1509.00817">https://arxiv.org/pdf/1509.00817</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6lJxaahQr"/></comment> </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
        <source>RStudio</source>
        <year>2015</year>  
        <access-date>2016-03-26</access-date>
        <publisher-loc>Boston, MA</publisher-loc>
        <publisher-name>RStudio, Inc</publisher-name>
        <comment>RStudio: integrated development for R
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.rstudio.com/">https://www.rstudio.com/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHzyHxHu"/></comment> </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Barry</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Hartigan</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A Bayesian analysis for change point problems</article-title>
        <source>J Am Stat Assoc</source>
        <year>1993</year>  
        <volume>88</volume>  
        <issue>421</issue>  
        <fpage>309</fpage>  
        <lpage>319</lpage> </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>German</surname>
            <given-names>RR</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Horan</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Milstein</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Pertowski</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>Waller</surname>
            <given-names>MN</given-names>
          </name>
          <collab>Guidelines Working Group Centers for Disease Control and Prevention (CDC)</collab>
        </person-group>
        <article-title>Updated guidelines for evaluating public health surveillance systems: recommendations from the Guidelines Working Group</article-title>
        <source>MMWR Recomm Rep</source>  
        <year>2001</year>  
        <month>07</month>  
        <day>27</day>  
        <volume>50</volume>  
        <issue>RR-13</issue>  
        <fpage>1</fpage>  
        <lpage>35; quiz CE1-7</lpage>  
        <pub-id pub-id-type="medline">18634202</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Twitter improves influenza forecasting</article-title>
        <source>PLoS Curr</source>  
        <year>2014</year>  
        <volume>6</volume>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.doi.org/10.1371/currents.outbreaks.90b9ed0f59bae4ccaa683a39865d9117"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/currents.outbreaks.90b9ed0f59bae4ccaa683a39865d9117</pub-id>
        <pub-id pub-id-type="medline">25642377</pub-id>
        <pub-id pub-id-type="pmcid">PMC4234396</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kass-Hout</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Google</source>  
        <year>2013</year>  
        <access-date>2016-03-26</access-date>
        <comment>Change point analysis: Introduction
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://sites.google.com/site/changepointanalysis/">https://sites.google.com/site/changepointanalysis/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHwpzPHi"/></comment> </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pervaiz</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Pervaiz</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Abdur Rehman</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Saif</surname>
            <given-names>U</given-names>
          </name>
        </person-group>
        <article-title>FluBreaks: early epidemic detection from Google flu trends</article-title>
        <source>J Med Internet Res</source>  
        <year>2012</year>  
        <volume>14</volume>  
        <issue>5</issue>  
        <fpage>e125</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/5/e125/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2102</pub-id>
        <pub-id pub-id-type="medline">23037553</pub-id>
        <pub-id pub-id-type="pii">v14i5e125</pub-id>
        <pub-id pub-id-type="pmcid">PMC3510767</pub-id></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <!-- Conference-proceedings citation: one author, conference name/date/location,
             page range, and a single pub-id of type doi. -->
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu-Chen</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Integrating and mining virtual communities across multiple online social networks: concepts, approaches and challenges</article-title>
          <source>Proceedings of the Fourth International Conference on Digital Information and Communication Technology and its Applications</source>
          <year>2014</year>
          <conf-name>The Fourth International Conference on Digital Information and Communication Technology and its Applications</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Bangkok, Thailand</conf-loc>
          <fpage>199</fpage>
          <lpage>204</lpage>
          <pub-id pub-id-type="doi">10.1109/DICTAP.2014.6821682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <!-- Web citation with a source and an access date only (no author or year).
             The <comment> below is mixed content: descriptive text (presumably the
             page title) followed by an ext-link to the live URL and a second ext-link
             of type "webcite" whose xlink:href is a bare identifier, not a full URL.
             Whitespace inside <comment> is part of its text, so do not re-indent it. -->
        <nlm-citation citation-type="web">
        <source>Pew Research Center</source>  
        <access-date>2016-03-26</access-date>
        <comment>Internet user demographics
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/data-trend/internet-use/latest-stats/">http://www.pewinternet.org/data-trend/internet-use/latest-stats/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6gHwYYhqI"/></comment> </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <!-- Journal citation: seven authors, full year/month/day date, volume and
             page range, and pub-ids of type doi, medline and pmcid. -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cavazos-Rehg</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sowles</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rosas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bharadwaj</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bierut</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>A content analysis of depression-related Tweets</article-title>
          <source>Comput Human Behav</source>
          <year>2016</year>
          <month>01</month>
          <day>1</day>
          <volume>54</volume>
          <fpage>351</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2015.08.023</pub-id>
          <pub-id pub-id-type="medline">26392678</pub-id>
          <pub-id pub-id-type="pmcid">PMC4574287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <!-- Journal citation: two authors, volume and first page (no issue), one
             ext-link inside <comment>, and pub-ids of type doi, medline, pii and pmcid. -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reavley</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Pilkington</surname>
              <given-names>PD</given-names>
            </name>
          </person-group>
          <article-title>Use of Twitter to monitor attitudes toward depression and schizophrenia: an exploratory study</article-title>
          <source>PeerJ</source>
          <year>2014</year>
          <volume>2</volume>
          <fpage>e647</fpage>
          <comment>
            <ext-link xlink:type="simple"
                      xlink:href="http://dx.doi.org/10.7717/peerj.647"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.647</pub-id>
          <pub-id pub-id-type="medline">25374786</pub-id>
          <pub-id pub-id-type="pii">647</pub-id>
          <pub-id pub-id-type="pmcid">PMC4217192</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <!-- Journal citation: three authors, volume/issue/first page, one ext-link
             inside <comment>, and pub-ids of type doi, medline and pii (no pmcid). -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>What Online Communities Can Tell Us About Electronic Cigarettes and Hookah Use: A Study Using Text Mining and Visualization Techniques</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <volume>17</volume>
          <issue>9</issue>
          <fpage>e220</fpage>
          <comment>
            <ext-link xlink:type="simple"
                      xlink:href="http://www.jmir.org/2015/9/e220/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4517</pub-id>
          <pub-id pub-id-type="medline">26420469</pub-id>
          <pub-id pub-id-type="pii">v17i9e220</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <!-- Journal citation: seven authors, volume and first page (no issue), one
             ext-link inside <comment>, and pub-ids of type doi, medline, pii and pmcid. -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sowles</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zewdie</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Grucza</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Bierut</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cavazos-Rehg</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Hookah-Related Twitter Chatter: A Content Analysis</article-title>
          <source>Prev Chronic Dis</source>
          <year>2015</year>
          <volume>12</volume>
          <fpage>E121</fpage>
          <comment>
            <ext-link xlink:type="simple"
                      xlink:href="http://www.cdc.gov/pcd/issues/2015/15_0140.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.5888/pcd12.150140</pub-id>
          <pub-id pub-id-type="medline">26226068</pub-id>
          <pub-id pub-id-type="pii">E121</pub-id>
          <pub-id pub-id-type="pmcid">PMC4523113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <!-- Journal citation: two authors, volume/issue/first page, one ext-link
             inside <comment>, and pub-ids of type doi, medline and pmcid (no pii).
             The ext-link path is /year/issue/fpage/, the same shape as the other
             jmir.org links in this reference list; the final segment must match
             <fpage>. -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krueger</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Twitter: A Novel Tool for Studying the Health and Social Needs of Transgender Communities</article-title>
          <source>JMIR Ment Health</source>
          <year>2015</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e16</fpage>
          <comment>
            <ext-link xlink:type="simple"
                      xlink:href="http://mental.jmir.org/2015/2/e16/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.4113</pub-id>
          <pub-id pub-id-type="medline">26082941</pub-id>
          <pub-id pub-id-type="pmcid">PMC4465794</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <!-- Journal citation: six authors, year and month, volume/issue/first page,
             one ext-link inside <comment>, and pub-ids of type doi, medline, pii
             and pmcid. -->
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Combining Search, Social Media, and Traditional Data Sources to Improve Influenza Surveillance</article-title>
          <source>PLoS Comput Biol</source>
          <year>2015</year>
          <month>10</month>
          <volume>11</volume>
          <issue>10</issue>
          <fpage>e1004513</fpage>
          <comment>
            <ext-link xlink:type="simple"
                      xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1004513"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004513</pub-id>
          <pub-id pub-id-type="medline">26513245</pub-id>
          <pub-id pub-id-type="pii">PCOMPBIOL-D-15-00856</pub-id>
          <pub-id pub-id-type="pmcid">PMC4626021</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
