<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v5i2e12214</article-id>
      <article-id pub-id-type="pmid">30946017</article-id>
      <article-id pub-id-type="doi">10.2196/12214</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Improved Real-Time Influenza Surveillance: Using Internet Search Data in Eight Latin American Countries</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sanchez</surname>
            <given-names>Travis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>McLeod</surname>
            <given-names>Bob</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pollett</surname>
            <given-names>Simon</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
          <name name-style="western">
            <surname>Clemente</surname>
            <given-names>Leonardo</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8939-8841</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Fred</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1026-5734</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3" corresp="yes">
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>Mauricio</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Computational Health Informatics Program</institution>
            <institution>Boston Children's Hospital</institution>
            <addr-line>1 Autumn St</addr-line>
            <addr-line>Boston, MA, 02215</addr-line>
            <country>United States</country>
            <phone>1 617 919 1795</phone>
            <email>msantill@g.harvard.edu</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-4206-418X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>School of Engineering and Sciences</institution>
      <institution>Tecnologico de Monterrey</institution>  
      <addr-line>Monterrey</addr-line>
      <country>Mexico</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Computational Health Informatics Program</institution>
      <institution>Boston Children's Hospital</institution>  
      <addr-line>Boston, MA</addr-line>
      <country>United States</country></aff>
      <aff id="aff3">
      <label>3</label>
      <institution>Department of Pediatrics</institution>
      <institution>Harvard Medical School</institution>  
      <addr-line>Boston, MA</addr-line>
      <country>United States</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Mauricio Santillana 
        <email>msantill@g.harvard.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><season>Apr-Jun</season><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>04</day>
        <month>04</month>
        <year>2019</year>
      </pub-date>
      <volume>5</volume>
      <issue>2</issue>
      <elocation-id>e12214</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>14</day>
          <month>9</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>18</day>
          <month>1</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>2</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>2</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Leonardo Clemente, Fred Lu, Mauricio Santillana. Originally published in JMIR Public Health and Surveillance (http://publichealth.jmir.org), 04.04.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on http://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://publichealth.jmir.org/2019/2/e12214/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
        <title>Background</title> 
        <p>Novel influenza surveillance systems that leverage Internet-based real-time data sources including Internet search frequencies, social-network information, and crowd-sourced flu surveillance tools have shown improved accuracy over the past few years in data-rich countries like the United States. These systems not only track flu activity accurately, but they also report flu estimates a week or more ahead of the publication of reports produced by healthcare-based systems, such as those implemented and managed by the Centers for Disease Control and Prevention. Previous work has shown that the predictive capabilities of novel flu surveillance systems, like Google Flu Trends (GFT), in developing countries in Latin America have not yet delivered acceptable flu estimates.</p></sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to show that recent methodological improvements on the use of Internet search engine information to track diseases can lead to improved retrospective flu estimates in multiple countries in Latin America.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A machine learning-based methodology that uses flu-related Internet search activity and historical information to monitor flu activity, named ARGO (AutoRegression with Google search), was extended to generate flu predictions for 8 Latin American countries (Argentina, Bolivia, Brazil, Chile, Mexico, Paraguay, Peru, and Uruguay) for the time period: January 2012 to December of 2016. These retrospective (out-of-sample) Influenza activity predictions were compared with historically observed flu suspected cases in each country, as reported by Flunet, an influenza surveillance database maintained by the World Health Organization. For a baseline comparison, retrospective (out-of-sample) flu estimates were produced for the same time period using autoregressive models that only leverage historical flu activity information.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our results show that ARGO-like models’ predictive power outperform autoregressive models in 6 out of 8 countries in the 2012-2016 time period. Moreover, ARGO significantly improves on historical flu estimates produced by the now discontinued GFT for the time period of 2012-2015, where GFT information is publicly available.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We demonstrate here that a self-correcting machine learning method, leveraging Internet-based disease-related search activity and historical flu trends, has the potential to produce reliable and timely flu estimates in multiple Latin American countries. This methodology may prove helpful to local public health officials who design and implement interventions aimed at mitigating the effects of influenza outbreaks. Our methodology generally outperforms both the now-discontinued tool GFT, and autoregressive methodologies that exploit only historical flu activity to produce future disease estimates.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>google flu trends</kwd>
        <kwd>influenza monitoring</kwd>
        <kwd>real-time disease surveillance</kwd>
        <kwd>digital epidemiology</kwd>
        <kwd>influenza, human</kwd>
        <kwd>developing countries</kwd>
        <kwd>machine learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>With the highest mortality of any respiratory infectious disease in the young and elderly in Latin America, influenza poses significant health and economic challenges to low- and middle-income countries in the region [<xref ref-type="bibr" rid="ref1">1</xref>]. The World Health Organization (WHO) maintains a health care–based disease surveillance system that collects information on flu activity from local ministries of health around the world. Unfortunately, these reports have a common delay of at least a week in Latin America, limiting the ability for a timely response to unexpected epidemic outbreaks. Reliable surveillance systems that monitor flu activity in real time in this region would help public health institutions deploy timely vaccination campaigns and optimally allocate resources during epidemic outbreaks. Multiple research teams have proposed complementary methods to estimate and forecast flu activity in real time in data-rich countries such as the United States, using techniques ranging from statistical [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>] to mechanistic [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>] and incorporating a variety of data sources, such as internet search information, flu-related Twitter microblogs [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>], crowdsourced flu surveillance [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], clinician search activity [<xref ref-type="bibr" rid="ref10">10</xref>], electronic health records [<xref ref-type="bibr" rid="ref11">11</xref>], and Wikipedia access [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], as summarized in a study by Santillana [<xref ref-type="bibr" rid="ref14">14</xref>]. However, a reliable system that leverages internet search activity to monitor flu activity in multiple developing nations is not yet available.</p>
        <p>An early large-scale implementation of real-time disease surveillance started in 2008 with Google Flu Trends (GFT), a Web-based tool that used Google search activity to produce flu activity estimates in multiple locations around the world [<xref ref-type="bibr" rid="ref15">15</xref>]. Although GFT was initially perceived as a technological innovation, its large prediction errors during the 2009 H1N1 flu pandemic and the 2013 flu season in the United States raised methodological concerns from multiple researchers [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. A recent study by Pollet et al showed that GFT’s flu estimates in Latin America had yielded poor results [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The discontinuation of GFT in 2015 led many to believe that internet search trends were too noisy to track disease activity, a problem exacerbated in developing countries with limited internet access. However, recent research has shown that robust and dynamically self-correcting machine learning methodologies can extract meaningful signals from real-time search activity to track Zika and Dengue activity in low- to middle-income countries around the world [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. We apply lessons learned from these studies and successfully extend a state-of-the-art modeling approach for flu surveillance to 8 Latin American countries.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Acquisition</title>
        <p>We built a predictive methodology aimed at estimating suspected flu activity, as reported by FluNet, an online surveillance tool maintained by the WHO. FluNet collects and aggregates multiple indicators of flu activity at the country level. For this study, we selected the number of processed specimens (NPSs) as the ground truth. As these specimens were taken from patients with flu-like symptoms and then sent to a laboratory for testing, we interpreted them as an indicator of suspected flu activity in the population. Weekly aggregated NPS reports were collected from January 5, 2009, to December 25, 2016, for Argentina, Bolivia, Brazil, Chile, Mexico, Paraguay, Peru, and Uruguay.</p>
        <p>Given their near real-time availability via the online tool, Google Trends, we selected influenza-related internet search activity to be used in our models as proxies or predictors for flu activity. Where available and based on country-specific historical flu indicators (during the training time period of our models), we used the online tool, Google Correlate, to identify flu-related search term trends, leading to a total of 285 Spanish terms and 96 Portuguese terms. See <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for further description of this process.</p>
      </sec>
      <sec>
        <title>Models and Benchmarks</title>
        <p>We extended AutoRegression with Google search information (ARGO), a methodology originally conceived and tested to track flu activity in the United States in multiple spatial scales as a way to produce retrospective and strictly out-of-sample flu estimates individually for each country [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. This methodology is based on a multivariable regularized linear model that is dynamically recalibrated every week as new flu activity information becomes available. Besides online search information, ARGO incorporates short-term and seasonal historical flu information to improve the accuracy of predictions and mitigate the undesired effect of spikes in search activity (induced perhaps by overreaction in the population during potential health threats reported by the news). More details on this approach can be found in a study by Yang et al [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>Given a weekly as-yet-unseen NPS report to estimate, we used historical NPS and Google Trends information from the previous most recent 2 years (104 weeks) of data to calibrate ARGO and predict the given week’s NPS report. To assess ARGO’s predictive power, we built autoregressive models separately for each country (named AR52 throughout this paper) that only use historical flu activity from the 52 weeks before predictions and generated retrospective out-of-sample estimates over the same time period. All models were built using the glmnet package on MATLAB (MathWorks) version 2014a [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
      <sec>
        <title>Metrics</title>
        <p>To compare the predictive ability of ARGO and AR52, we calculated Pearson correlations and the root mean square error between model predictions and the subsequently observed suspected flu cases. The added value of using Google search activity as a predictor was tested via an efficiency metric [<xref ref-type="bibr" rid="ref22">22</xref>] that quantifies the improvement of ARGO over a simple autoregressive model. This efficiency metric is calculated as the ratio between the mean square errors of AR52 and ARGO. For the efficiency metric, 90% CIs were generated using the stationary block bootstrap method [<xref ref-type="bibr" rid="ref24">24</xref>]. We report 2 additional metrics aimed at evaluating our method’s ability to correctly identify the timing of peaks and timing of the onset of epidemic outbreaks. These metrics are referred to as ∆P and ∆O, respectively, and measure the distance, in weeks, between the observed peak (or onsets) and the predicted one. See <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for further explanation.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>AutoRegression With Google Search Models Outperform AR52 and Google Flu Trends</title>
        <p>Retrospective out-of-sample estimates of flu activity were produced, for each of the 8 countries, from January 1, 2012, to December 25, 2016, and compared with the FluNet reported suspected cases (NPSs). Brazil’s NPS data were only available until October 9, 2016. Note that because of FluNet’s reporting delays, our models, which rely on past available values of FluNet and current internet search activity, estimate current flu activity at least 1 week ahead of official reports.</p>
        <p>In <xref ref-type="fig" rid="figure1">Figure 1</xref>, we show our real-time flu estimates and the subsequently observed suspected flu cases for each country. Contextually, historical GFT values (scaled to be displayed alongside with NPS values) and autoregressive estimates are also shown. Our models (ARGO and AR52) accurately predict NPS values in each country. GFT shows consistently large discrepancies when compared with the observed values, consistent with the findings reported by Pollett et al [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
        <p>ARGO displays improvement in 6 countries in terms of the efficiency metric (<xref ref-type="fig" rid="figure2">Figure 2</xref>), reaching significant error reductions compared with AR52 in Brazil (155 to 104 or 33%), Mexico (243 to 184 or 24%), Peru (48 to 40 or 16%), and Chile (131 to 119 or 9%). ARGO consistently outperforms GFT on Pearson correlations during the time period when GFT was active in every country and improves upon AR52 in all countries except Bolivia and Uruguay, over the whole study period, reaching significant correlation increases in Brazil (from 0.891 to 0.957), Mexico (from 0.86 to 0.92), and Peru (from 0.84 to 0.89).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Graphical representation of the number of processed specimens (NPSs) as reported by WHO’s FluNet (black), along with the NPS estimates generated by ARGO (red), AR (light blue), and Google Flu Trends (GFT; blue), over the whole study period of January 1, 2012 to December 25, 2016.</p>
          </caption>
          <graphic xlink:href="publichealth_v5i2e12214_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Set of bar graphs that show our performance metrics to assess the predictive power of AutoRegression with Google search (ARGO). (a) Efficiency metric values (salmon color) for each individual country with their respective 90% CI (solid black line). (b) Root mean square error (RMSE) values for ARGO (red) and AR52 (light blue) during the whole study period. Each country’s RMSE value is normalized by their respective average number of processed specimen (NPS) over the whole study period to avoid scale differences in visualization. c) Pearson correlation scores of ARGO and AR during the full period. d) Pearson correlation values for ARGO (red), AR (gray), and Google Flu Trends (GFT; blue) during the period in our study where GFT was active.</p>
          </caption>
          <graphic xlink:href="publichealth_v5i2e12214_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Peaks and Onsets</title>
        <p><xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> shows our method’s ability to identify the timing of peaks and timing of the onset as captured by the metrics ∆P and ∆O, respectively. Out of a total of 39 peaks, ARGO predicts 10 on the observed week, 5 ahead of time, and 24 with a lag. In contrast, AR52 predicted 7 peaks exactly, 2 ahead of time, and 30 with a lag. Out of 39 measured onsets, ARGO predicted 11 at the exact date, 12 ahead of time, and 13 with a lag, with the rest of the onsets incorrectly estimated with more than a month’s distance. AR52 predicted 8 onsets at the exact time, 8 ahead of time, 20 with a lag, and the rest were estimated with more than a month’s distance. As expected, the baseline autoregressive model, AR52, predicted more outbreak peaks late, with a lag of at least a week. ARGO, in contrast, is slightly more responsive and predicts outbreak peaks on time or weeks before the observed peak. Furthermore, even when ARGO’s peak timing is not accurate, the magnitude of the peak is captured better than its AR52 counterpart. For more detailed information, see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Combining Historical Flu Activity and Google Search Data</title>
        <p>ARGO’s prediction performance shows that internet search volumes and historical flu activity, when combined with dynamic machine learning techniques, can effectively detect real-time suspected flu cases in several Latin American countries. Our results considerably outperform the historical predictive performance of GFT highlighting (1) the importance of moving away from one-size-fits-all approaches such as those used by GFT and (b) the value of combining local flu epidemiological information with influenza-related internet search trends. The overall improvement of ARGO over the baseline autoregressive model indicates that internet search engine data, even in middle-income countries, provide increased responsiveness to changing disease trends. This improvement is clear in Brazil, Chile, Mexico, Peru, Paraguay, and Argentina, whereas in Uruguay and Bolivia, the inclusion of Google search data does not seem to improve the baseline model.</p>
        <p>The availability of an online tool to select relevant flu-related terms (Google Correlate) that track historical flu activity was found to be a critical element for ARGO to improve performance over the autoregressive benchmark (Argentina, Chile, Mexico, Peru, and Brazil), suggesting that the most meaningful flu-related search queries are country-specific. In countries, such as Uruguay, where many weekly data points were missing on FluNet, ARGO’s predictive ability was reduced. Our best performance was seen in Brazil, Mexico, and Peru, where flu data were collected consistently every week during this study’s time period (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
      </sec>
      <sec>
        <title>Number of Processed Specimens as Our Gold Standard</title>
        <p>On the basis of our previous research findings monitoring Dengue and Zika activity in Latin America [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], we chose the number of suspected influenza cases (as captured by the FluNet’s NPSs) as our gold standard for our prediction tasks. Our choice was based on the intuitive fact that flu-related Google search activity is higher when more people “suspect” they may be affected by flu-like symptoms, regardless of the outcome of any lab test. As such, our models may prove useful to improve the timely allocation of resources in health care facilities in situations when increased numbers of people, with flu-like symptoms and respiratory needs, may need to be seen. It is relevant to point out that using NPS case counts as a gold standard implies that our models are not directly estimating confirmed influenza case counts but suspected Influenza-like Illness activity trends. Our choice of gold standard is meaningful as it may help health care providers prepare for traffic fluctuations of patients presenting with symptoms of influenza. However, from an epidemiological perspective, more standard test-positive influenza proportions reported on previous Latin America studies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] should also be considered in future studies.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>Combining internet search volumes and historical flu activity via ARGO shows strong potential for the development of timely flu surveillance in low- or middle-income countries. However, flu estimates at the national level may not be reflective of outbreak conditions at the local level, especially in countries with significant geographical heterogeneity. At present, FluNet only provides national-level flu data. In the future, as more fine-grained epidemiological information becomes available in developing countries, studies should evaluate the feasibility of deploying disease surveillance platforms at finer spatial scales. Successful extensions of our methodologies at the city and state levels in data-rich environments such as the United States [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] indicate that ARGO-like methodologies can accurately monitor influenza at these spatial resolutions. Moreover, there is strong evidence that internet access is rapidly increasing in many Latin American countries [<xref ref-type="bibr" rid="ref28">28</xref>], leading us to hypothesize that the performance of methodologies using internet-based data will increase over time following an increase of the quality of Google search data.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Supplementary materials. This document includes several Tables and Figures, as well as more information regarding our Methods and Results section.</p>
        <media xlink:href="publichealth_v5i2e12214_app1.pdf" xlink:title="PDF File (Adobe PDF File), 5MB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ARGO</term>
          <def>
            <p>AutoRegression with Google search</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GFT</term>
          <def>
            <p>Google Flu Trends</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NPS</term>
          <def>
            <p>number of processed specimens</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>MS and FL were partially funded by the Centers for Disease Control and Prevention’s Cooperative 375 Agreement PPHF 11797-998G-15. LC was partially funded by a grant 734557 by the Mexico National Council of Science and Technology. MS was partially supported by the National Institute of General Medical Sciences, of the National Institutes of Health, under Award Number R01GM130668. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Savy</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Ciapponi</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bardach</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Glujovsky</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Aruj</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Mazzoni</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ortega-Barría</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Colindres</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Burden of influenza in Latin America and the Caribbean: a systematic review and meta-analysis</article-title>
        <source>Influenza Other Respir Viruses</source>  
        <year>2013</year>  
        <month>11</month>  
        <volume>7</volume>  
        <issue>6</issue>  
        <fpage>1017</fpage>  
        <lpage>32</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/irv.12036"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/irv.12036</pub-id>
        <pub-id pub-id-type="medline">23210504</pub-id>
        <pub-id pub-id-type="pmcid">PMC4634294</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Brooks</surname>
            <given-names>LC</given-names>
          </name>
          <name name-style="western">
            <surname>Farrow</surname>
            <given-names>DC</given-names>
          </name>
          <name name-style="western">
            <surname>Hyun</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Tibshirani</surname>
            <given-names>RJ</given-names>
          </name>
          <name name-style="western">
            <surname>Rosenfeld</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Flexible modeling of epidemics with an empirical Bayes Framework</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2015</year>  
        <month>08</month>  
        <volume>11</volume>  
        <issue>8</issue>  
        <fpage>e1004382</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1004382"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004382</pub-id>
        <pub-id pub-id-type="medline">26317693</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-14-01884</pub-id>
        <pub-id pub-id-type="pmcid">PMC4552841</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tibshirani</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Regression shrinkage and selection via the lasso: a retrospective</article-title>
        <source>J R Stat Soc Series B Stat Methodol</source>  
        <year>2011</year>  
        <volume>73</volume>  
        <issue>3</issue>  
        <fpage>273</fpage>  
        <lpage>82</lpage>  
        <pub-id pub-id-type="doi">10.1111/j.1467-9868.2011.00771.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shaman</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Karspeck</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Forecasting seasonal outbreaks of influenza</article-title>
        <source>Proc Natl Acad Sci U S A</source>  
        <year>2012</year>  
        <month>12</month>  
        <day>11</day>  
        <volume>109</volume>  
        <issue>50</issue>  
        <fpage>20425</fpage>  
        <lpage>30</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=23184969"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1073/pnas.1208772109</pub-id>
        <pub-id pub-id-type="medline">23184969</pub-id>
        <pub-id pub-id-type="pii">1208772109</pub-id>
        <pub-id pub-id-type="pmcid">PMC3528592</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Perra</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Perrota</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Tizzoni</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Paolotti</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Forecasting seasonal influenza fusing digital indicators and a mechanistic disease model</article-title>
        <source>Proceedings of the 26th International Conference on World Wide Web</source>  
        <year>2017</year>  
        <conf-name>WWW'17</conf-name>
        <conf-date>April 3-7, 2017</conf-date>
        <conf-loc>Perth, Australia</conf-loc>
        <fpage>311</fpage>  
        <pub-id pub-id-type="doi">10.1145/3038912.3052678</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Infodemiology: tracking flu-related searches on the web for syndromic surveillance</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2006</year>  
        <fpage>244</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17238340"/>
        </comment>  
        <pub-id pub-id-type="medline">17238340</pub-id>
        <pub-id pub-id-type="pii">86095</pub-id>
        <pub-id pub-id-type="pmcid">PMC1839505</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>You are what you Tweet: Analyzing Twitter for public health</article-title>
        <source>International AAAI Conference on Weblogs and Social Media</source>  
        <year>2011</year>  
        <conf-name>Fifth International ICWSM</conf-name>
        <conf-date>July 17-21, 2011</conf-date>
        <conf-loc>Barcelona, Spain</conf-loc>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cs.jhu.edu/~mpaul/files/2011.icwsm.twitter_health.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Smolinski</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Crawley</surname>
            <given-names>AW</given-names>
          </name>
          <name name-style="western">
            <surname>Baltrusaitis</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Chunara</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Olsen</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Wójcik</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Nguyen</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>Flu near you: crowdsourced symptom reporting spanning 2 influenza seasons</article-title>
        <source>Am J Public Health</source>  
        <year>2015</year>  
        <month>10</month>  
        <volume>105</volume>  
        <issue>10</issue>  
        <fpage>2124</fpage>  
        <lpage>30</lpage>  
        <pub-id pub-id-type="doi">10.2105/AJPH.2015.302696</pub-id>
        <pub-id pub-id-type="medline">26270299</pub-id>
        <pub-id pub-id-type="pmcid">PMC4566540</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paolotti</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Carnahan</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Colizza</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Eames</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Edmunds</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Gomes</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Koppeschaar</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Rehn</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Smallenburg</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Turbelin</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Van</surname>
            <given-names>NS</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Web-based participatory surveillance of infectious diseases: the Influenzanet participatory surveillance experience</article-title>
        <source>Clin Microbiol Infect</source>  
        <year>2014</year>  
        <month>01</month>  
        <volume>20</volume>  
        <issue>1</issue>  
        <fpage>17</fpage>  
        <lpage>21</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1198-743X(14)60188-9"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/1469-0691.12477</pub-id>
        <pub-id pub-id-type="medline">24350723</pub-id>
        <pub-id pub-id-type="pii">S1198-743X(14)60188-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Nsoesie</surname>
            <given-names>EO</given-names>
          </name>
          <name name-style="western">
            <surname>Mekaru</surname>
            <given-names>SR</given-names>
          </name>
          <name name-style="western">
            <surname>Scales</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
        </person-group>
        <article-title>Using clinicians' search query data to monitor influenza epidemics</article-title>
        <source>Clin Infect Dis</source>  
        <year>2014</year>  
        <month>11</month>  
        <day>15</day>  
        <volume>59</volume>  
        <issue>10</issue>  
        <fpage>1446</fpage>  
        <lpage>50</lpage>  
        <pub-id pub-id-type="doi">10.1093/cid/ciu647</pub-id>
        <pub-id pub-id-type="medline">25115873</pub-id>
        <pub-id pub-id-type="pii">ciu647</pub-id>
        <pub-id pub-id-type="pmcid">PMC4296132</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Gray</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Richardson</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kou</surname>
            <given-names>SC</given-names>
          </name>
        </person-group>
        <article-title>Using electronic health records and Internet search information for accurate influenza forecasting</article-title>
        <source>BMC Infect Dis</source>  
        <year>2017</year>  
        <month>05</month>  
        <day>8</day>  
        <volume>17</volume>  
        <issue>1</issue>  
        <fpage>332</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcinfectdis.biomedcentral.com/articles/10.1186/s12879-017-2424-7"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/s12879-017-2424-7</pub-id>
        <pub-id pub-id-type="medline">28482810</pub-id>
        <pub-id pub-id-type="pii">10.1186/s12879-017-2424-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC5423019</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Generous</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Deshpande</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>SY</given-names>
          </name>
          <name name-style="western">
            <surname>Priedhorsky</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Global disease monitoring and forecasting with Wikipedia</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2014</year>  
        <month>11</month>  
        <volume>10</volume>  
        <issue>11</issue>  
        <fpage>e1003892</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003892"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003892</pub-id>
        <pub-id pub-id-type="medline">25392913</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-14-00678</pub-id>
        <pub-id pub-id-type="pmcid">PMC4231164</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hickmann</surname>
            <given-names>KS</given-names>
          </name>
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Priedhorsky</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Generous</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Hyman</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Deshpande</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>SY</given-names>
          </name>
        </person-group>
        <article-title>Forecasting the 2013-2014 influenza season using Wikipedia</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>11</volume>  
        <issue>5</issue>  
        <fpage>e1004239</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1004239"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004239</pub-id>
        <pub-id pub-id-type="medline">25974758</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-14-01771</pub-id>
        <pub-id pub-id-type="pmcid">PMC4431683</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Editorial commentary: perspectives on the future of internet search engines and biosurveillance systems</article-title>
        <source>Clin Infect Dis</source>  
        <year>2017</year>  
        <month>12</month>  
        <day>1</day>  
        <volume>64</volume>  
        <issue>1</issue>  
        <fpage>42</fpage>  
        <lpage>3</lpage>  
        <pub-id pub-id-type="doi">10.1093/cid/ciw660</pub-id>
        <pub-id pub-id-type="medline">27678086</pub-id>
        <pub-id pub-id-type="pii">ciw660</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ginsberg</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Mohebbi</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Patel</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Brammer</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Smolinski</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Brilliant</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Detecting influenza epidemics using search engine query data</article-title>
        <source>Nature</source>  
        <year>2009</year>  
        <month>02</month>  
        <day>19</day>  
        <volume>457</volume>  
        <issue>7232</issue>  
        <fpage>1012</fpage>  
        <lpage>4</lpage>  
        <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
        <pub-id pub-id-type="medline">19020500</pub-id>
        <pub-id pub-id-type="pii">nature07634</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Althouse</surname>
            <given-names>BM</given-names>
          </name>
          <name name-style="western">
            <surname>Ayers</surname>
            <given-names>JW</given-names>
          </name>
        </person-group>
        <article-title>What can digital disease detection learn from (an external revision to) Google Flu Trends?</article-title>
        <source>Am J Prev Med</source>  
        <year>2014</year>  
        <month>09</month>  
        <volume>47</volume>  
        <issue>3</issue>  
        <fpage>341</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.amepre.2014.05.020</pub-id>
        <pub-id pub-id-type="medline">24997572</pub-id>
        <pub-id pub-id-type="pii">S0749-3797(14)00238-4</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lazer</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Kennedy</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>King</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Big data. The parable of Google Flu: traps in big data analysis</article-title>
        <source>Science</source>  
        <year>2014</year>  
        <month>03</month>  
        <day>14</day>  
        <volume>343</volume>  
        <issue>6176</issue>  
        <fpage>1203</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="doi">10.1126/science.1248506</pub-id>
        <pub-id pub-id-type="medline">24626916</pub-id>
        <pub-id pub-id-type="pii">343/6176/1203</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Olson</surname>
            <given-names>DR</given-names>
          </name>
          <name name-style="western">
            <surname>Konty</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Paladini</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Viboud</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Simonsen</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Reassessing Google Flu Trends data for detection of seasonal and pandemic influenza: a comparative epidemiological study at three geographic scales</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2013</year>  
        <volume>9</volume>  
        <issue>10</issue>  
        <fpage>e1003256</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003256"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003256</pub-id>
        <pub-id pub-id-type="medline">24146603</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-13-00957</pub-id>
        <pub-id pub-id-type="pmcid">PMC3798275</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pollett</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Boscardin</surname>
            <given-names>WJ</given-names>
          </name>
          <name name-style="western">
            <surname>Azziz-Baumgartner</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Tinoco</surname>
            <given-names>YO</given-names>
          </name>
          <name name-style="western">
            <surname>Soto</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Romero</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kok</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Biggerstaff</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Viboud</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Rutherford</surname>
            <given-names>GW</given-names>
          </name>
        </person-group>
        <article-title>Evaluating Google Flu Trends in Latin America: important lessons for the next phase of digital disease detection</article-title>
        <source>Clin Infect Dis</source>  
        <year>2017</year>  
        <month>01</month>  
        <day>1</day>  
        <volume>64</volume>  
        <issue>1</issue>  
        <fpage>34</fpage>  
        <lpage>41</lpage>  
        <pub-id pub-id-type="doi">10.1093/cid/ciw657</pub-id>
        <pub-id pub-id-type="medline">27678084</pub-id>
        <pub-id pub-id-type="pii">ciw657</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kou</surname>
            <given-names>SC</given-names>
          </name>
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Brooke</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Advances in using Internet searches to track dengue</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2017</year>  
        <month>07</month>  
        <volume>13</volume>  
        <issue>7</issue>  
        <fpage>e1005607</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1005607"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1005607</pub-id>
        <pub-id pub-id-type="medline">28727821</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-16-02052</pub-id>
        <pub-id pub-id-type="pmcid">PMC5519005</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>McGough</surname>
            <given-names>SF</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Hawkins</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Forecasting Zika incidence in the 2016 Latin America outbreak combining traditional disease surveillance with search, social media, and news report data</article-title>
        <source>PLoS Negl Trop Dis</source>  
        <year>2017</year>  
        <month>12</month>  
        <volume>11</volume>  
        <issue>1</issue>  
        <fpage>e0005295</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pntd.0005295"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pntd.0005295</pub-id>
        <pub-id pub-id-type="medline">28085877</pub-id>
        <pub-id pub-id-type="pii">PNTD-D-16-01733</pub-id>
        <pub-id pub-id-type="pmcid">PMC5268704</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kou</surname>
            <given-names>SC</given-names>
          </name>
        </person-group>
        <article-title>Accurate estimation of influenza epidemics using Google search data via ARGO</article-title>
        <source>Proc Natl Acad Sci U S A</source>  
        <year>2015</year>  
        <month>11</month>  
        <day>24</day>  
        <volume>112</volume>  
        <issue>47</issue>  
        <fpage>14473</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=26553980"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1073/pnas.1515373112</pub-id>
        <pub-id pub-id-type="medline">26553980</pub-id>
        <pub-id pub-id-type="pii">1515373112</pub-id>
        <pub-id pub-id-type="pmcid">PMC4664296</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Qian</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hastie</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Tibshirani</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Simon</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <source>WebCite</source>  
        <year>2013</year>  
        <access-date>2019-02-28</access-date>
        <comment>Glmnet in Matlab 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.webcitation.org/76YjrZOGa">http://www.webcitation.org/76YjrZOGa</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="76Yk0dh0J"/></comment> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Politis</surname>
            <given-names>DN</given-names>
          </name>
          <name name-style="western">
            <surname>Romano</surname>
            <given-names>JP</given-names>
          </name>
        </person-group>
        <article-title>The stationary bootstrap</article-title>
        <source>J Am Stat Assoc</source>  
        <year>2012</year>  
        <month>02</month>  
        <day>27</day>  
        <volume>89</volume>  
        <issue>428</issue>  
        <fpage>1303</fpage>  
        <lpage>13</lpage>  
        <pub-id pub-id-type="doi">10.1080/01621459.1994.10476870</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Durand</surname>
            <given-names>LO</given-names>
          </name>
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Palekar</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Clara</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Jara</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cerpa</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>el Omeiri</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Ropero-Alvarez</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Ramirez</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Araya</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Acosta</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Bruno</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>de Lozano</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Castillo Signor</surname>
            <given-names>LD</given-names>
          </name>
          <name name-style="western">
            <surname>Matute</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>Jackson-Betty</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mung</surname>
            <given-names>KS</given-names>
          </name>
          <name name-style="western">
            <surname>Díaz-Quiñonez</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>López-Martinez</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Balmaseda</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Arévalo</surname>
            <given-names>BM</given-names>
          </name>
          <name name-style="western">
            <surname>Vazquez</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Gutierrez</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Garten</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Widdowson</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Azziz-Baumgartner</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Timing of influenza epidemics and vaccines in the American tropics, 2002-2008, 2011-2014</article-title>
        <source>Influenza Other Respir Viruses</source>  
        <year>2016</year>  
        <month>05</month>  
        <volume>10</volume>  
        <issue>3</issue>  
        <fpage>170</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/irv.12371"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/irv.12371</pub-id>
        <pub-id pub-id-type="medline">26701079</pub-id>
        <pub-id pub-id-type="pmcid">PMC4814866</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>FS</given-names>
          </name>
          <name name-style="western">
            <surname>Hou</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Baltrusaitis</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Leskovec</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sosic</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hawkins</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Conidi</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Gunn</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Gray</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Zink</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Accurate influenza monitoring and forecasting using novel Internet data streams: a case study in the Boston Metropolis</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2018</year>  
        <month>01</month>  
        <day>9</day>  
        <volume>4</volume>  
        <issue>1</issue>  
        <fpage>e4</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/1/e4/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.8950</pub-id>
        <pub-id pub-id-type="medline">29317382</pub-id>
        <pub-id pub-id-type="pii">v4i1e4</pub-id>
        <pub-id pub-id-type="pmcid">PMC5780615</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>FS</given-names>
          </name>
          <name name-style="western">
            <surname>Hattab</surname>
            <given-names>MW</given-names>
          </name>
          <name name-style="western">
            <surname>Clemente</surname>
            <given-names>CL</given-names>
          </name>
          <name name-style="western">
            <surname>Biggerstaff</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Santillana</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Improved state-level influenza nowcasting in the United States leveraging internet-based data and network approaches</article-title>
        <source>Nat Commun</source>  
        <year>2019</year>  
        <month>12</month>  
        <day>11</day>  
        <volume>10</volume>  
        <issue>1</issue>  
        <fpage>147</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30635558"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/s41467-018-08082-0</pub-id>
        <pub-id pub-id-type="medline">30635558</pub-id>
        <pub-id pub-id-type="pii">10.1038/s41467-018-08082-0</pub-id>
        <pub-id pub-id-type="pmcid">PMC6329822</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
        <source>International Telecommunication Union</source>  
        <access-date>2019-02-08</access-date>
        <comment>Statistics 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.itu.int/en/ITU-D/Statistics/Pages/stat/default.aspx">https://www.itu.int/en/ITU-D/Statistics/Pages/stat/default.aspx</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="761ThSiLh"/></comment> </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
