<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id><journal-id journal-id-type="publisher-id">publichealth</journal-id><journal-id journal-id-type="index">9</journal-id><journal-title>JMIR Public Health and Surveillance</journal-title><abbrev-journal-title>JMIR Public Health Surveill</abbrev-journal-title><issn pub-type="epub">2369-2960</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e59971</article-id><article-id pub-id-type="doi">10.2196/59971</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Meeting Global Health Needs via Infectious Disease Forecasting: Development of a Reliable Data-Driven Framework</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Keshavamurthy</surname><given-names>Ravikiran</given-names></name><degrees>BVSc, MVSc, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pazdernik</surname><given-names>Karl T</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ham</surname><given-names>Colby</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dixon</surname><given-names>Samuel</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Erwin</surname><given-names>Samantha</given-names></name><degrees>MS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Charles</surname><given-names>Lauren E</given-names></name><degrees>DVM, MS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Artificial Intelligence and Data Analytics Division, Pacific Northwest National Laboratory</institution><addr-line>902 Battelle Boulevard</addr-line><addr-line>Richland</addr-line><addr-line>WA</addr-line><country>United States</country></aff><aff id="aff2"><institution>Paul G. Allen School for Global Health, Washington State University</institution><addr-line>Pullman</addr-line><addr-line>WA</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Statistics, North Carolina State University</institution><addr-line>Raleigh</addr-line><addr-line>NC</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sahu</surname><given-names>Kirti Sundar</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Ma</surname><given-names>Simin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Hua</surname><given-names>Yining</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Lauren E Charles, DVM, MS, PhD, Artificial Intelligence and Data Analytics Division, Pacific Northwest National Laboratory, 902 Battelle Boulevard, Richland, WA, 99354, United States; <email>lauren.charles@pnnl.gov</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>21</day><month>3</month><year>2025</year></pub-date><volume>11</volume><elocation-id>e59971</elocation-id><history><date date-type="received"><day>27</day><month>04</month><year>2024</year></date><date date-type="rev-recd"><day>10</day><month>12</month><year>2024</year></date><date date-type="accepted"><day>24</day><month>12</month><year>2024</year></date></history><copyright-statement>&#x00A9; Ravikiran Keshavamurthy, Karl T Pazdernik, Colby Ham, Samuel Dixon, Samantha Erwin, Lauren E Charles. Originally published in JMIR Public Health and Surveillance (<ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>), 21.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://publichealth.jmir.org/2025/1/e59971"/><abstract><sec><title>Background</title><p>Infectious diseases (IDs) have a significant detrimental impact on global health. Timely and accurate ID forecasting can result in more informed implementation of control measures and prevention policies.</p></sec><sec><title>Objective</title><p>To meet the operational decision-making needs of real-world circumstances, we aimed to build a standardized, reliable, and trustworthy ID forecasting pipeline and visualization dashboard that is generalizable across a wide range of modeling techniques, IDs, and global locations.</p></sec><sec sec-type="methods"><title>Methods</title><p>We forecasted 6 diverse, zoonotic diseases (brucellosis, campylobacteriosis, Middle East respiratory syndrome, Q fever, tick-borne encephalitis, and tularemia) across 4 continents and 8 countries. We included a wide range of statistical, machine learning, and deep learning models (n=9) and trained them on a multitude of features (average n=2326) within the One Health landscape, including demography, landscape, climate, and socioeconomic factors. The pipeline and dashboard were created in consideration of crucial operational metrics&#x2014;prediction accuracy, computational efficiency, spatiotemporal generalizability, uncertainty quantification, and interpretability&#x2014;which are essential to strategic data-driven decisions.</p></sec><sec sec-type="results"><title>Results</title><p>While no single best model was suitable for all disease, region, and country combinations, our ensemble technique selects the best-performing model for each given scenario to achieve the closest prediction. For new or emerging diseases in a region, the ensemble model can predict how the disease may behave in the new region using a pretrained model from a similar region with a history of that disease. The data visualization dashboard provides a clean interface of important analytical metrics, such as ID temporal patterns, forecasts, prediction uncertainties, and model feature importance across all geographic locations and disease combinations.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>As the need for real-time, operational ID forecasting capabilities increases, this standardized and automated platform for data collection, analysis, and reporting is a major step forward in enabling evidence-based public health decisions and policies for the prevention and mitigation of future ID outbreaks.</p></sec></abstract><kwd-group><kwd>disease forecasting</kwd><kwd>machine learning</kwd><kwd>deep learning</kwd><kwd>epidemiology</kwd><kwd>One Health</kwd><kwd>decision-making</kwd><kwd>data visualization</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The frequency and magnitude of infectious disease (ID) events have seen a drastic incline in the past few decades, mainly attributed to climate change, urbanization, and globalization [<xref ref-type="bibr" rid="ref1">1</xref>]. These events often involve the emergence of novel infectious agents or the re-emergence of a previously known pathogen. Timely and accurate prediction of such ID events is crucial for decision makers to decrease associated mortality, morbidity, and economic losses [<xref ref-type="bibr" rid="ref2">2</xref>]. However, the complex and unpredictable nature of pathogen ecology makes forecasting the spatiotemporal dynamics of IDs a challenging task [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Digital information related to ID events is being generated and shared faster than ever before. Additionally, information associated with disease occurrence, such as meteorology, socioeconomics, demographics, land use, agriculture, social media, and internet trends, is often readily available [<xref ref-type="bibr" rid="ref4">4</xref>]. To keep up with this unprecedented amount of data being generated, machine learning (ML)&#x2013; and deep learning (DL)&#x2013;based algorithms are being adopted by the research community. These methods have shown to be better at detecting cryptic patterns arising from interactions between multiple features, which are difficult, often impossible at times, to uncover with conventional prediction methods [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>The time-series models have been previously used for forecasting ID events including brucellosis [<xref ref-type="bibr" rid="ref6">6</xref>], Middle East respiratory syndrome [<xref ref-type="bibr" rid="ref7">7</xref>], campylobacteriosis [<xref ref-type="bibr" rid="ref8">8</xref>], and Q fever [<xref ref-type="bibr" rid="ref5">5</xref>]. However, over the last decade, especially after the COVID-19 pandemic outbreak, considerable progress has been made in the field of ID surveillance, as the disease diagnosis, reporting, and intelligence-sharing infrastructure continue to grow on a global scale [<xref ref-type="bibr" rid="ref9">9</xref>]. Dixion et al [<xref ref-type="bibr" rid="ref5">5</xref>] compared the performance of various forecasting approaches across several diseases and countries and found that tree-based techniques had better predictive performance compared to statistical and DL techniques. Integrating diverse large-scale epidemiological data from multiple sources has further enhanced the accuracy and utility of disease prediction models [<xref ref-type="bibr" rid="ref10">10</xref>]. Ensemble forecasting techniques, which merge predictions from multiple models, offer notable advantages over single-model approaches [<xref ref-type="bibr" rid="ref11">11</xref>]. For example, Reich et al [<xref ref-type="bibr" rid="ref12">12</xref>] used real-time multimodel ensembles for seasonal influenza in the United States, while Ma et al [<xref ref-type="bibr" rid="ref13">13</xref>] demonstrated the effectiveness of integrating internet search data along with ensemble forecasting techniques to jointly forecast COVID-19 and influenza-like illnesses, underscoring the value of diverse data sources in public health forecasting.</p><p>Despite several advantages, ML and DL techniques do come with a number of limitations, making them less desirable in the real-world operational setting. We conducted a scoping systematic review to determine the status and advances made in the field of ID prediction using ML and DL, which were published elsewhere [<xref ref-type="bibr" rid="ref9">9</xref>]. One of our focuses in this systematic review was to identify if and how researchers were incorporating the necessary methods required to eventually enable the operational deployment of their ID forecasting models. Through this work, we identified multiple shortcomings in published modeling techniques that could hinder their ability to support operational biopreparedness and decision-making. Even though most of the studies focused on increasing the prediction accuracy of their models, which is critical for operational deployment, they did not address other important decision-making metrics such as computational efficiency, uncertainty quantification, interpretability, and generalizability. Modern ML and DL techniques are performance-driven, that is, they aim to generate better predictive or classification accuracy by minimizing errors [<xref ref-type="bibr" rid="ref14">14</xref>]. As a result, other metrics that are crucial for operational decision-making are often overlooked by the scientific community. First, as the structural and functional complexities of the forecasting models evolve, the computational resources required to train such models also grow considerably. In addition, these complexities result in an expanded number of model hyperparameters that can be individually tuned using numerous possible techniques. This ever-increasing complexity gives rise to an even larger problem space with highly variable results. Second, since most of these techniques are nonparametric in nature, model uncertainties are not inherently estimated. Hence, model uncertainties are often overlooked even though these estimates are crucial for systematic and transparent decision-making [<xref ref-type="bibr" rid="ref15">15</xref>]. Third, ML and DL models are considered black boxes, meaning that their internal logic and inner workings are mostly hidden from the end user [<xref ref-type="bibr" rid="ref9">9</xref>]. Consequently, verifying and understanding the rationale behind the model forecasts are difficult and often neglected. With the above considerations in mind, we developed an ID forecasting pipeline that holistically focuses on these often neglected yet essential performance metrics required for operational decision support. By incorporating this pipeline into an interactive dashboard, we created a capability that allows users to easily visualize the ID forecasting results for use in operational planning and decision-making.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>The graphical flowchart illustrating our forecasting pipeline including data ingest, preprocessing, model training, prediction, and visualization is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Graphical flowchart illustrating the infectious disease forecasting pipeline. ARIMA: autoregressive integrated moving average; LGBM: light gradient boosting machine; LSTM: long short-term memory; PI: prediction interval; RF: random forest; RNN: recurrent neural network; SARIMAX: seasonal autoregressive integrated moving average with exogenous factors; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e59971_fig01.png"/></fig></sec><sec id="s2-2"><title>Case Count Data</title><p>The model outcome variable was case counts collected from EpiArchive [<xref ref-type="bibr" rid="ref16">16</xref>] and Food and Agriculture Organization&#x2019;s Emergency Prevention System-I [<xref ref-type="bibr" rid="ref17">17</xref>]. We included the most consistent, available, and interpretable disease case counts from these sources. These data also included locations that reported only 0 disease cases. In instances where only the disease presence was reported without any information about the exact number of cases, the region, or the date of occurrence, such disease-location combinations were excluded from the analysis. We included all the diseases that spanned across multiple countries or regions and had a consistent reporting of disease events for our study period. Data were collected at the regional-level resolution for each country from January 2014 to December 2018, which contained case counts at either the weekly or monthly temporal resolution.</p></sec><sec id="s2-3"><title>Feature Data</title><p>We collected feature data from a variety of open sources across the One Health landscape (<xref ref-type="table" rid="table1">Table 1</xref>). Broadly, the features included historic case counts (case count lags up to 6 months), country census data, socioeconomic factors, health data, agricultural trade data, landscape, and climate records. The feature information varied in spatial and temporal resolutions; data were typically available at monthly or yearly resolutions and covered either the country or regional level. A complete list of countries, regions, and the total number of features collected for each region is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The input feature data types, source, feature description by name, geographic location, geographic resolution, time period, and periodicity. The table was originally published by Dixon et al [<xref ref-type="bibr" rid="ref5">5</xref>].</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Data type</td><td align="left" valign="bottom">Individual features</td><td align="left" valign="bottom">Geographic location</td><td align="left" valign="bottom">Geographic resolution</td><td align="left" valign="bottom">Time period</td><td align="left" valign="bottom">Periodicity</td></tr></thead><tbody><tr><td align="left" valign="top">Case counts [<xref ref-type="bibr" rid="ref16">16</xref>]</td><td align="left" valign="top">Incidences of select human diseases</td><td align="left" valign="top">Countries of interest</td><td align="left" valign="top">Region level</td><td align="left" valign="top">2009-2018</td><td align="left" valign="top">Daily</td></tr><tr><td align="left" valign="top">Political borders [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top">Geopolitical borders (country and within the country)</td><td align="left" valign="top">Countries of interest</td><td align="left" valign="top">Region level</td><td align="left" valign="top">2018</td><td align="left" valign="top">Single instance</td></tr><tr><td align="left" valign="top">Climate [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Air temperature, humidity, precipitation, soil moisture, and wind speed</td><td align="left" valign="top">Global</td><td align="left" valign="top">Gridded 0.25 &#x00B0;&#x00D7;0.25 &#x00B0;, 1 &#x00B0;&#x00D7;1 &#x00B0;</td><td align="left" valign="top">2012&#x2010;2018</td><td align="left" valign="top">Monthly</td></tr><tr><td align="left" valign="top">Gross domestic product [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">Gross domestic product</td><td align="left" valign="top">Global</td><td align="left" valign="top">Country level</td><td align="left" valign="top">Varies</td><td align="left" valign="top">Yearly</td></tr><tr><td align="left" valign="top">Elevation [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Digital elevation map</td><td align="left" valign="top">Global</td><td align="left" valign="top">43,200&#x00D7;17,200 (30 arc seconds)</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">N/A</td></tr><tr><td align="left" valign="top">Mortality [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">Deaths by country, year, sex, age group, and cause of death</td><td align="left" valign="top">Global</td><td align="left" valign="top">Country level</td><td align="left" valign="top">2009&#x2010;2018</td><td align="left" valign="top">Yearly</td></tr><tr><td align="left" valign="top">Municipal waste [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Municipal waste generation and treatment</td><td align="left" valign="top">Countries of interest</td><td align="left" valign="top">Country level</td><td align="left" valign="top">2009&#x2010;2017</td><td align="left" valign="top">Yearly</td></tr><tr><td align="left" valign="top">Sociopolitical and physical data [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">Socioeconomic and political attributes</td><td align="left" valign="top">Global</td><td align="left" valign="top">Varies by country; 1: 10-110 m</td><td align="left" valign="top">2019</td><td align="left" valign="top">Single instance</td></tr><tr><td align="left" valign="top">Population [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">Population by age intervals by location</td><td align="left" valign="top">Global</td><td align="left" valign="top">Country level</td><td align="left" valign="top">2009&#x2010;2015</td><td align="left" valign="top">Every 5 years</td></tr><tr><td align="left" valign="top">Population density [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">Population density</td><td align="left" valign="top">Global</td><td align="left" valign="top">30 arc seconds</td><td align="left" valign="top">2009&#x2010;2015</td><td align="left" valign="top">Every 5 years</td></tr><tr><td align="left" valign="top">Water potability and treatment [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Freshwater resources, available water, wastewater treatment plant capacity, surface water</td><td align="left" valign="top">Countries of interest</td><td align="left" valign="top">Country level</td><td align="left" valign="top">2009&#x2010;2017</td><td align="left" valign="top">Yearly</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>N/A: not applicable.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-4"><title>Data Preparation and Imputation</title><p>The harvested raw data contained information at varied spatial and temporal resolutions in different file formats. These raw data were harmonized to create the final datasets containing monthly case counts and input features for each region within the country. In situations where the feature data at the regional level were missing, the features aggregated by an average at the national level were used. Any features with more than 20% missing values across all regions and dates were not included as a predictor variable. The remaining missing values were imputed temporally using spline and forward-fill techniques for monthly and yearly feature data, respectively. Some features could not easily be imputed temporally through these techniques but were still sufficiently prevalent across regions to include in the models. In these instances, the majority of the missing data (less than 20% overall) came from only a few select regions. For these special cases, we performed geoimputation using the k-nearest neighbor method and restricted input to only regional feature data within the same country. We used distance-based weights for the features with 5 neighboring samples for imputation. The imputation techniques were implemented using the &#x201C;pandas&#x201D; and &#x201C;skforecast&#x201D; libraries in Python (Python Software Foundation) [<xref ref-type="bibr" rid="ref26">26</xref>].</p></sec><sec id="s2-5"><title>Model Choice</title><sec id="s2-5-1"><title>Overview</title><p>In our analysis, we included the following models discussed in detail below: statistical time-series models (ie, autoregressive integrated moving average [ARIMA], seasonal autoregressive integrated moving average with exogenous factors [SARIMAX], and Prophet), tree-based models (ie, random forest [RF], extreme gradient boosting [XGB], and light gradient boosting machine [LBGM]), and DL models (recurrent neural network [RNN], long short-term memory [LSTM], and transformer).</p></sec><sec id="s2-5-2"><title>Statistical Time-Series Models</title><p>The ARIMA model is a traditional statistical technique used in time-series forecasting. These models use a linear, regression-type equation, in which the predictors are lags of the dependent variable or lags of the forecast errors. The SARIMAX is an extension of ARIMA that takes seasonal trends into account within time-series data. Because SARIMAX can also accommodate exogenous features, it is often preferable to traditional ARIMA. However, SARIMAX models may fail to converge if those exogenous features are highly correlated. To overcome this issue, the least absolute shrinkage and selection operator (LASSO) regression was used for feature selection and dimensionality reduction. These LASSO-selected features were later used as input variables for SARIMAX. The modeling techniques were implemented using &#x201C;statsmodels&#x201D; and &#x201C;sklearn&#x201D; libraries in Python [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p><p>Prophet is a decomposable time-series model that uses 3 main components to make its forecasts, namely, trend, seasonality, and holidays [<xref ref-type="bibr" rid="ref30">30</xref>]. The trend component models the nonperiodic changes in the time series. Seasonality models the periodic, or seasonal, changes in the time series; this can be an important part of a disease forecasting model, as many diseases have seasonal trends. The Prophet model was implemented using the &#x201C;darts&#x201D; library in Python [<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec><sec id="s2-5-3"><title>Tree-Based ML Models</title><p>Tree-based models make predictions by creating decision trees that divide the feature space using a series of binary decision thresholds. The RF is an extension of the decision tree method that uses an ensemble of decision trees to increase performance and reduce the risk of overfitting the training data. The XGB is an implementation of a decision tree that uses stochastic gradient boosting to sequentially improve prediction during training. Because of this methodology, XGB achieves superior accuracy in prediction tasks. LGBM is similar to XGB; however, it also applies a novel sampling method and feature bundling process that allows the method to get comparable performance to XGB but uses far less memory and trains much faster. These modeling techniques were implemented using &#x201C;skforecast&#x201D; library in Python [<xref ref-type="bibr" rid="ref32">32</xref>].</p></sec><sec id="s2-5-4"><title>DL Models</title><p>The RNN is built on DL architecture with a hidden state that memorizes sequential data. This added process provides the model with an understanding of temporal information in a time-series sequence. The LSTM is an extension of RNN with additional parameters that incorporate different scales of temporal information, which allow the model to effectively use both long- and short-term temporal data in its prediction. Hence, these models are routinely used in disease forecasting tasks.</p><p>Transformers [<xref ref-type="bibr" rid="ref33">33</xref>] are another form of DL architecture that has been recently outperforming other models in many applications of ML. These models leverage a structure known as &#x201C;attention,&#x201D; which allows them to model dependence in both short and long temporal lags. Unfortunately, these models are especially slow to train and often require very large amounts of data and computational power. The DL techniques were implemented as an encoder-record architecture using &#x201C;darts&#x201D; library in Python.</p></sec></sec><sec id="s2-6"><title>Model Training and Prediction</title><p>The model training involved hyperparameter tuning and model fitting, whereas model testing involved generating 1-step ahead forecasts (ie, monthly) and their prediction intervals (PIs). When creating predictions, all feature data and disease case counts up until the time of prediction were included in the model. The model training included hyperparameter tuning using a 5-fold time-series cross-validation split and model fitting. First, the models were trained using 2014&#x2010;2016 data and tested on 2017 data. Subsequently, the model was retrained using 2014&#x2010;2017 data and tested on 2018 data in a sliding window manner. A detailed description of model-specific hyperparameters and their search space used for model training is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-7"><title>Model Evaluation</title><p>The forecasting models were evaluated in two ways: (1) <italic>F</italic><sub>1</sub>-score to evaluate the ability of a model to predict the presence or absence of a disease in each region (ie, did the region report 1 or more cases during the testing period) and (2) mean absolute error (MAE) for the subset of predictions where the disease was detected in a region (case counts greater than 0). The multimetric approach was adopted because of the high frequency of time-location pairs that had no disease present. Without separating these results, the MAE metric was largely driven by the results of the high-frequency disease and regions. Finally, we created ensemble models by selecting the best-performing technique based on the MAE of the testing dataset. Other metrics such as precision, recall, negative predictive value, true negatives, false positives, false negatives, and true positives were also estimated but not considered when building our ensemble model.</p></sec><sec id="s2-8"><title>Uncertainty Quantification and Interpretability</title><p>The 95% PIs for our forecasted values were estimated to account for forecasting uncertainties. For statistical models (ARIMA, SARIMAX, and Prophet), PIs were readily obtained along with the model forecasts as a natural consequence of the model construction. However, PIs were not directly available for ML and DL techniques. Hence, we used Python packages that retroactively produced PIs using alternate techniques. The PIs for tree-based models (RF, XGB, and LGBM) were estimated by a bootstrapping technique using &#x201C;skforecast&#x201D; library, whereas for DL models (RNN, LSTM, and transformer), PIs were calculated by a nonparametric method known as quantile regression using the &#x201C;Darts&#x201D; library [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. For each model forecast, we estimated the coverage probability of the 95% PIs (ie, instances where the PIs surrounded the true value) as a measure of calibration assessment for the prediction uncertainties.</p><p>Feature importance, based on Shapley Additive Explanation (SHAP) values for the best-performing models, was used as a generalized approach to interpretability for tree-based and DL models [<xref ref-type="bibr" rid="ref34">34</xref>]. SARIMAX was the only statistical model that allowed for feature input and interpretability, which was provided by coefficient estimates from the model. However, the SARIMAX model was unable to incorporate the large number of features available for each region. To address this limitation, a feature selection approach was applied using LASSO regression to reduce the model&#x2019;s input variables.</p><p>The historic case count data are important and most frequently used predictive features in the ID prediction domain [<xref ref-type="bibr" rid="ref9">9</xref>]. In our analysis, we used case count lags up to 6 months. To estimate the relative importance of these case count lags compared to other features, we calculated 2 metrics, namely, the feature ratio and mean reciprocal rank (MRR). A threshold of the top 10 features, as deemed by the models, was set to estimate the feature ratio and MRR. The feature ratio was the total number of lag case count features divided by the total number of features (up to the top 10 features). The MRR, on the other hand, also considers the position of the first relevant item in the ranked list, that is, case count lags. The MRR was defined as the mean of reciprocal ranks of case count lags across all features. The values range from 0 to 1, with a higher score signifying the greater relative feature importance rank of case count lags compared to other features for obtaining model forecasts.</p></sec><sec id="s2-9"><title>Spatial Generalizability Using Transfer Learning</title><p>We used the transfer learning framework to test the models for their ability to produce accurate forecasts in regions that were fairly new to the disease. These regions were strategically picked by maximizing the global coverage and following the stratified random sampling framework. First, only the country-disease combinations where case count data were available were selected. This process also included the regions that reported 0 disease cases during our study period. Next, one region within the selected countries was randomly picked and denoted as the target region. Then, we selected a similar region to the target region to train the transfer learning models based on (1) the target and similar region being part of the same country and (2) the target and similar region containing comparable case counts over the last 6 months. The similar region pretrained model was then used to forecast the disease case counts of the target region, and performance was assessed.</p></sec><sec id="s2-10"><title>Ethical Considerations</title><p>Data used in this study are open source and do not identify individual information, either directly or indirectly. Therefore, this research was exempted from ethical review.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>The summary statistics of the disease-location combinations aggregated at the country level are presented in <xref ref-type="table" rid="table2">Table 2</xref>, whereas a detailed breakdown of this summary for both test and train split is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Median (IQR) regional case counts per country and disease for the entire dataset from January 2014 to December 2018.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Disease</td><td align="left" valign="bottom" colspan="8">Country</td></tr><tr><td align="left" valign="top"/><td align="left" valign="bottom">Australia, median (IQR)</td><td align="left" valign="bottom">Germany, median (IQR)</td><td align="left" valign="bottom">Israel, median (IQR)</td><td align="left" valign="bottom">Japan, median (IQR)</td><td align="left" valign="bottom">Norway, median (IQR)</td><td align="left" valign="bottom">Saudi Arabia, median (IQR)</td><td align="left" valign="bottom">Sweden, median (IQR)</td><td align="left" valign="bottom">United States, median (IQR)</td></tr></thead><tbody><tr><td align="left" valign="top">Brucellosis</td><td align="left" valign="top">3 (0-29)</td><td align="left" valign="top">11 (0-42)</td><td align="left" valign="top">30 (0-1072)</td><td align="left" valign="top">0 (0-3)</td><td align="left" valign="top">0 (0-2)</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">1 (0-2)</td><td align="left" valign="top">4 (0-25)</td></tr><tr><td align="left" valign="top">Campylobacteriosis</td><td align="left" valign="top">7904 (0-43,205)</td><td align="left" valign="top">148,616 ( 50,644-197,616)</td><td align="left" valign="top">998 (0-7666)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">306 (0-1456)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1103 (0-10,815)</td><td align="left" valign="top">1159 (0-25,327)</td></tr><tr><td align="left" valign="top">MERS<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">0 (0-0)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0 (0-0)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">3 (0-71)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Q fever</td><td align="left" valign="top">55 (0-974)</td><td align="left" valign="top">28 (0-769)</td><td align="left" valign="top">46 (0-103)</td><td align="left" valign="top">0 (0-1)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">5 (0-26)</td></tr><tr><td align="left" valign="top">Tick-borne encephalitis</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">15 (0-897)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0 (0-2)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Tularemia</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0 (0-0)</td><td align="left" valign="top">0 (0-1)</td><td align="left" valign="top">15 (0-69)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">4 (0-89)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Not available.</p></fn><fn id="table2fn2"><p><sup>b</sup>MERS: Middle East respiratory syndrome.</p></fn></table-wrap-foot></table-wrap><p>There were 757 disease-region combinations ran through 9 different models in this study. As the first step, we calculated <italic>F</italic><sub>1</sub>-scores to determine the ability of the forecasting models to detect the presence or absence of a disease in a given region (<xref ref-type="table" rid="table3">Table 3</xref>). Overall, tree-based models (ie, XGB, RF, and LGBM) and Prophet consistently had better and comparable <italic>F</italic><sub>1</sub>-scores across the diseases. The DL models (ie, RNN, transformer, and LSTM) had significantly lower <italic>F</italic><sub>1</sub>-scores. Patterns were consistent across all diseases in each region. The additional evaluation metrics for model and disease combination including precision, recall, negative predictive value, true negatives, false positives, false negatives, and true positives are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p><italic>F</italic><sub>1</sub>-score for all models forecasting the presence or absence of disease for each region in 2017 and 2018.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Disease</td><td align="left" valign="bottom" colspan="9">Model</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">ARIMA<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">LGBM<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">LSTM<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="bottom">Prophet</td><td align="left" valign="bottom">RF<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom">RNN<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="bottom">SARIMAX<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="bottom">Transformer</td><td align="left" valign="bottom">XGB<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="bottom">Brucellosis</td><td align="char" char="." valign="bottom">0.65</td><td align="char" char="." valign="bottom">0.67</td><td align="char" char="." valign="bottom">0.55</td><td align="char" char="." valign="bottom">0.69</td><td align="char" char="." valign="bottom">0.67</td><td align="char" char="." valign="bottom">0.56</td><td align="char" char="." valign="bottom">0.66</td><td align="char" char="." valign="bottom">0.59</td><td align="char" char="." valign="bottom">0.67</td></tr><tr><td align="left" valign="bottom">Campylobacteriosis</td><td align="char" char="." valign="bottom">0.93</td><td align="char" char="." valign="bottom">0.96</td><td align="char" char="." valign="bottom">0.96</td><td align="char" char="." valign="bottom">0.97</td><td align="char" char="." valign="bottom">0.96</td><td align="char" char="." valign="bottom">0.95</td><td align="char" char="." valign="bottom">0.91</td><td align="char" char="." valign="bottom">0.94</td><td align="char" char="." valign="bottom">0.96</td></tr><tr><td align="left" valign="bottom">MERS<sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td><td align="char" char="." valign="bottom">0.98</td><td align="char" char="." valign="bottom">0.90</td><td align="char" char="." valign="bottom">0.60</td><td align="char" char="." valign="bottom">0.90</td><td align="char" char="." valign="bottom">0.90</td><td align="char" char="." valign="bottom">0.61</td><td align="char" char="." valign="bottom">0.95</td><td align="char" char="." valign="bottom">0.56</td><td align="char" char="." valign="bottom">0.90</td></tr><tr><td align="left" valign="bottom">Q fever</td><td align="char" char="." valign="bottom">0.78</td><td align="char" char="." valign="bottom">0.78</td><td align="char" char="." valign="bottom">0.64</td><td align="char" char="." valign="bottom">0.79</td><td align="char" char="." valign="bottom">0.78</td><td align="char" char="." valign="bottom">0.67</td><td align="char" char="." valign="bottom">0.74</td><td align="char" char="." valign="bottom">0.65</td><td align="char" char="." valign="bottom">0.78</td></tr><tr><td align="left" valign="bottom">Tick-borne encephalitis</td><td align="char" char="." valign="bottom">0.68</td><td align="char" char="." valign="bottom">0.98</td><td align="char" char="." valign="bottom">0.59</td><td align="char" char="." valign="bottom">0.97</td><td align="char" char="." valign="bottom">0.98</td><td align="char" char="." valign="bottom">0.55</td><td align="char" char="." valign="bottom">0.95</td><td align="char" char="." valign="bottom">0.54</td><td align="char" char="." valign="bottom">0.98</td></tr><tr><td align="left" valign="bottom">Tularemia</td><td align="char" char="." valign="bottom">0.54</td><td align="char" char="." valign="bottom">0.73</td><td align="char" char="." valign="bottom">0.49</td><td align="char" char="." valign="bottom">0.71</td><td align="char" char="." valign="bottom">0.73</td><td align="char" char="." valign="bottom">0.50</td><td align="char" char="." valign="bottom">0.72</td><td align="char" char="." valign="bottom">0.55</td><td align="char" char="." valign="bottom">0.73</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ARIMA: autoregressive integrated moving average.</p></fn><fn id="table3fn2"><p><sup>b</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table3fn3"><p><sup>c</sup>LSTM: long short-term memory.</p></fn><fn id="table3fn4"><p><sup>d</sup>RF: random forest.</p></fn><fn id="table3fn5"><p><sup>e</sup>RNN: recurrent neural network.</p></fn><fn id="table3fn6"><p><sup>f</sup>SARIMAX: seasonal autoregressive integrated moving average with exogenous factors.</p></fn><fn id="table3fn7"><p><sup>g</sup>XGB: extreme gradient boosting.</p></fn><fn id="table3fn8"><p><sup>h</sup>MERS: Middle East respiratory syndrome.</p></fn></table-wrap-foot></table-wrap><p>Next, we assessed the performance of each model for the subset of regions, where the total case counts were greater than 0 (ie, the disease was present) based on MAE. The model with the lowest MAE was inconsistent across diseases (<xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>MAE<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (95% CI) for each disease aggregated across all locations where the disease was present in 2017 and 2018.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Disease</td><td align="left" valign="bottom" colspan="9">Model</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">ARIMA<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">LGBM<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">LSTM<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">Prophet, MAE (95% CI)</td><td align="left" valign="bottom">RF<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">RNN<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">SARIMAX<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup>, MAE (95% CI)</td><td align="left" valign="bottom">Transformer, MAE (95% CI)</td><td align="left" valign="bottom">XGB<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup>, MAE (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="bottom">Brucellosis</td><td align="char" char="." valign="bottom">0.8 (0.5&#x2010;1.1)</td><td align="char" char="." valign="bottom">0.8 (0.5&#x2010;1.1)</td><td align="char" char="." valign="bottom">0.84 (0.5&#x2010;1.14)</td><td align="char" char="." valign="bottom">0.9 (0.5&#x2010;1.2)</td><td align="char" char="." valign="bottom">0.8 (0.5&#x2010;1.1)</td><td align="char" char="." valign="bottom">0.9 (0.5&#x2010;1.2)</td><td align="char" char="." valign="bottom">1.1 (0.7&#x2010;1.6)</td><td align="char" char="." valign="bottom">0.8 (0.5&#x2010;1.6)</td><td align="char" char="." valign="bottom">0.8 (0.4&#x2010;1.1)</td></tr><tr><td align="left" valign="bottom">Campylobacteriosis</td><td align="char" char="." valign="bottom">237.9 (1.1&#x2010;474.9)</td><td align="char" char="." valign="bottom">43.8 (35.3&#x2010;52.3)</td><td align="char" char="." valign="bottom">45.2 (36.3&#x2010;54.12)</td><td align="char" char="." valign="bottom">43.4 (34.9&#x2010;51.8)</td><td align="char" char="." valign="bottom">39.8 (32.3&#x2010;47.2)</td><td align="char" char="." valign="bottom">46.6 (37.7&#x2010;55.5)</td><td align="char" char="." valign="bottom">243.7 (74.9&#x2010;412.6)</td><td align="char" char="." valign="bottom">50.9 (40.3&#x2010;61.6)</td><td align="char" char="." valign="bottom">43.1 (34.2&#x2010;52.1)</td></tr><tr><td align="left" valign="bottom">Q fever</td><td align="char" char="." valign="bottom">28.9 (25.4&#x2010;83.1)</td><td align="char" char="." valign="bottom">1.5 (0.9&#x2010;2.1)</td><td align="char" char="." valign="bottom">1.18 (0.8&#x2010;1.6)</td><td align="char" char="." valign="bottom">1.4 (0.9&#x2010;1.9)</td><td align="char" char="." valign="bottom">1.5 (0.8&#x2010;2.1)</td><td align="char" char="." valign="bottom">1.3 (0.9&#x2010;1.8)</td><td align="char" char="." valign="bottom">1.9 (1.2&#x2010;2.7)</td><td align="char" char="." valign="bottom">1.4 (0.9&#x2010;2.0)</td><td align="char" char="." valign="bottom">1.2 (0.9&#x2010;1.5)</td></tr><tr><td align="left" valign="bottom">Tick-borne encephalitis</td><td align="char" char="." valign="bottom">2.0 (0.6&#x2010;3.3)</td><td align="char" char="." valign="bottom">2.4 (0.7&#x2010;4.1)</td><td align="char" char="." valign="bottom">2.61 (0.7&#x2010;4.53)</td><td align="char" char="." valign="bottom">1.3 (0.5&#x2010;2.2)</td><td align="char" char="." valign="bottom">2.4 (0.6&#x2010;4.1)</td><td align="char" char="." valign="bottom">2.6 (0.7&#x2010;4.6)</td><td align="char" char="." valign="bottom">1.6 (0.6&#x2010;2.6)</td><td align="char" char="." valign="bottom">2.9 (0.7&#x2010;5.2)</td><td align="char" char="." valign="bottom">2.4 (0.6&#x2010;4.1)</td></tr><tr><td align="left" valign="bottom">Tularemia</td><td align="char" char="." valign="bottom">0.6 (0.4&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.6 (0.5&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.58 (0.5&#x2010;0.71)</td><td align="char" char="." valign="bottom">0.6 (0.5&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.6 (0.5&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.6 (0.4&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.7 (0.5&#x2010;0.9)</td><td align="char" char="." valign="bottom">0.6 (0.5&#x2010;0.7)</td><td align="char" char="." valign="bottom">0.6 (0.5&#x2010;0.7)</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>MAE: mean absolute error.</p></fn><fn id="table4fn2"><p><sup>b</sup>ARIMA: autoregressive integrated moving average.</p></fn><fn id="table4fn3"><p><sup>c</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table4fn4"><p><sup>d</sup>LSTM: long short-term memory.</p></fn><fn id="table4fn5"><p><sup>e</sup>RF: random forest.</p></fn><fn id="table4fn6"><p><sup>f</sup>RNN: recurrent neural network.</p></fn><fn id="table4fn7"><p><sup>g</sup>SARIMAX: seasonal autoregressive integrated moving average with exogenous factors.</p></fn><fn id="table4fn8"><p><sup>h</sup>XGB: extreme gradient boosting.</p></fn></table-wrap-foot></table-wrap><p>The MAE of the best-performing model for each disease across all locations (with case counts greater than 0) is presented in <xref ref-type="table" rid="table5">Table 5</xref>, which we define as our &#x201C;ensemble&#x201D; model. Using this technique and when averaging across all regions, prediction years, and diseases, we observed that the ensemble model had the lowest MAE compared to other models (<xref ref-type="table" rid="table6">Table 6</xref>). While the difference does not appear to be a large amount, the difference is considerable, and the magnitude is visually minimized by the large error in the ARIMA and SARIMAX models. All the models included in our study had similar MAE except for ARIMA and SARIMAX since they had a few outlier predictions that skewed their MAE.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Ensemble (best performing) models for each disease averaged across all regions where the disease was present in 2017 and 2018.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Disease</td><td align="left" valign="bottom">Best model</td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="bottom">Brucellosis</td><td align="left" valign="bottom">LGBM<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup></td><td align="char" char="." valign="bottom">0.8 (0.5&#x2010;1.1)</td></tr><tr><td align="left" valign="bottom">Campylobacteriosis</td><td align="left" valign="bottom">RF<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup></td><td align="char" char="." valign="bottom">39.8 (32.3&#x2010;47.2)</td></tr><tr><td align="left" valign="bottom">Q fever</td><td align="left" valign="bottom">LSTM<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup></td><td align="char" char="." valign="bottom">1.2 (0.8&#x2010;1.6)</td></tr><tr><td align="left" valign="bottom">Tick-borne encephalitis</td><td align="left" valign="bottom">Prophet</td><td align="char" char="." valign="bottom">1.4 (0.5&#x2010;2.2)</td></tr><tr><td align="left" valign="bottom">Tularemia</td><td align="left" valign="bottom">ARIMA<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="char" char="." valign="bottom">0.6 (0.4&#x2010;0.7)</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>MAE: mean absolute error.</p></fn><fn id="table5fn2"><p><sup>b</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table5fn3"><p><sup>c</sup>RF: random forest.</p></fn><fn id="table5fn4"><p><sup>d</sup>LSTM: long short-term memory.</p></fn><fn id="table5fn5"><p><sup>e</sup>ARIMA: autoregressive integrated moving average.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>MAE<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup> (95% CIs) for each model aggregated across all diseases and regions where the disease was present in 2017 and 2018.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">MAE (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="bottom">ARIMA<sup><xref ref-type="table-fn" rid="table6fn2">b</xref></sup></td><td align="char" char="." valign="bottom">115.2 (5.2&#x2010;225.2)</td></tr><tr><td align="left" valign="bottom">Ensemble</td><td align="char" char="." valign="bottom">8.7 (6.5&#x2010;23.9)</td></tr><tr><td align="left" valign="bottom">LGBM<sup><xref ref-type="table-fn" rid="table6fn3">c</xref></sup></td><td align="char" char="." valign="bottom">20.8 (16.5&#x2010;25.1)</td></tr><tr><td align="left" valign="bottom">LSTM<sup><xref ref-type="table-fn" rid="table6fn4">d</xref></sup></td><td align="char" char="." valign="bottom">21.4 (16.9&#x2010;25.9)</td></tr><tr><td align="left" valign="bottom">Prophet</td><td align="char" char="." valign="bottom">20.6 (16.3&#x2010;24.9)</td></tr><tr><td align="left" valign="bottom">RF<sup><xref ref-type="table-fn" rid="table6fn5">e</xref></sup></td><td align="char" char="." valign="bottom">19.0 (15.2&#x2010;22.8)</td></tr><tr><td align="left" valign="bottom">RNN<sup><xref ref-type="table-fn" rid="table6fn6">f</xref></sup></td><td align="char" char="." valign="bottom">22.1 (17.6&#x2010;26.7)</td></tr><tr><td align="left" valign="bottom">SARIMAX<sup><xref ref-type="table-fn" rid="table6fn7">g</xref></sup></td><td align="char" char="." valign="bottom">113.1 (34.6&#x2010;191.6)</td></tr><tr><td align="left" valign="bottom">Transformer</td><td align="char" char="." valign="bottom">24.2 (18.8&#x2010;29.5)</td></tr><tr><td align="left" valign="bottom">XGB<sup><xref ref-type="table-fn" rid="table6fn8">h</xref></sup></td><td align="char" char="." valign="bottom">20.5 (16.0&#x2010;25.0)</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>MAE: mean absolute error.</p></fn><fn id="table6fn2"><p><sup>b</sup>ARIMA: autoregressive integrated moving average.</p></fn><fn id="table6fn3"><p><sup>c</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table6fn4"><p><sup>d</sup>LSTM: long short-term memory.</p></fn><fn id="table6fn5"><p><sup>e</sup>RF: random forest.</p></fn><fn id="table6fn6"><p><sup>f</sup>RNN: recurrent neural network.</p></fn><fn id="table6fn7"><p><sup>g</sup>SARIMAX: seasonal autoregressive integrated moving average with exogenous factors.</p></fn><fn id="table6fn8"><p><sup>h</sup>XGB: extreme gradient boosting.</p></fn></table-wrap-foot></table-wrap><p>The average training time, which included hyperparameter tuning and model fitting, along with prediction time (ie, the time to generate 1-step ahead forecasts and their PIs) for each model averaged across all diseases, regions, and periods are presented in <xref ref-type="fig" rid="figure2">Figure 2</xref>. The LGBM followed by ARIMA were the most time-efficient models. Although RF and XGB had a training time comparable with other models, their average prediction time was considerably higher mainly because of the increased amount of time required by them to generate 95% PIs using the bootstrapping technique.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>(A) Average hyperparameter tuning and model fitting time and (B) average training and prediction time for each model averaged across all diseases, locations, and periods. ARIMA: autoregressive integrated moving average; LGBM: light gradient boosting machine; LSTM: long short-term memory; RF: random forest; RNN: recurrent neural network; SARIMAX: seasonal autoregressive integrated moving average with exogenous factors; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e59971_fig02.png"/></fig></sec><sec id="s3-2"><title>Feature Importance</title><p>For the tree-based models (ie, LGBM, RF, and XGB), we selected up to 10 top features based on SHAP values that the model deemed important and calculated feature ratio and MRR to show how lag case count may be impacting our predictive performance (<xref ref-type="fig" rid="figure3">Figure 3</xref>). Overall, the feature ratios were low (&#x003C;0.4) when aggregated across countries and diseases, suggesting that non&#x2013;lag case count features were more important for forecasting compared to case lag data. Campylobacteriosis and tick-borne encephalitis had higher MRR compared to other diseases, indicating that lag case count features were ranked relatively higher among the top 10 features for these diseases. However, the low feature ratio and MRR for many diseases highlight how the additional feature variables can be valuable in disease forecasting, especially for less prevalent diseases. A complete breakdown of feature ratios and MRRs for each country-disease combination is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Relative importance of case count lags to produce forecasts for tree-based models quantified as feature ratios and mean reciprocal ranks of the most important features (up to the top 10) aggregated across countries (top row) and diseases (bottom row). Higher scores signify the greater relative importance of case count lags compared to other features for obtaining model forecasts. LGBM: light gradient boosting machine; MERS: Middle East respiratory syndrome; RF: random forest; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e59971_fig03.png"/></fig><p>The coverage probability of the forecasting models represented by the percent coverage of the true observations by 95% PIs is presented in <xref ref-type="table" rid="table7">Table 7</xref>. The LGBM had a 94.4% (n=14,707) coverage, indicating that the PIs were well calibrated, even better than traditional statistical models like ARIMA and SARIMAX. On the other hand, the DL models had less than 10% coverage, highlighting the fact that these models were not thoroughly calibrated. This observation was true when the coverage percentage was broken down across disease and country combinations in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t7" position="float"><label>Table 7.</label><caption><p>Coverage percentage of the 95% prediction intervals of the forecasting models<sup><xref ref-type="table-fn" rid="table7fn1">a</xref></sup>.</p></caption><table id="table7" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Coverage, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">ARIMA<sup><xref ref-type="table-fn" rid="table7fn2">b</xref></sup></td><td align="left" valign="top">14,582 (93.6)</td></tr><tr><td align="left" valign="top">LGBM<sup><xref ref-type="table-fn" rid="table7fn3">c</xref></sup></td><td align="left" valign="top">14,707 (94.4)</td></tr><tr><td align="left" valign="top">LSTM<sup><xref ref-type="table-fn" rid="table7fn4">d</xref></sup></td><td align="left" valign="top">1277 (8.2)</td></tr><tr><td align="left" valign="top">Prophet</td><td align="left" valign="top">13,086 (84)</td></tr><tr><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table7fn5">e</xref></sup></td><td align="left" valign="top">13,756 (88.3)</td></tr><tr><td align="left" valign="top">RNN<sup><xref ref-type="table-fn" rid="table7fn6">f</xref></sup></td><td align="left" valign="top">1246 (8)</td></tr><tr><td align="left" valign="top">SARIMAX<sup><xref ref-type="table-fn" rid="table7fn7">g</xref></sup></td><td align="left" valign="top">13,959 (89.6)</td></tr><tr><td align="left" valign="top">Transformer</td><td align="left" valign="top">1262 (8.1)</td></tr><tr><td align="left" valign="top">XGB<sup><xref ref-type="table-fn" rid="table7fn8">h</xref></sup></td><td align="left" valign="top">13,491 (86.6)</td></tr></tbody></table><table-wrap-foot><fn id="table7fn1"><p><sup>a</sup>The ideal coverage percentage is 95%.</p></fn><fn id="table7fn2"><p><sup>b</sup>ARIMA: autoregressive integrated moving average.</p></fn><fn id="table7fn3"><p><sup>c</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table7fn4"><p><sup>d</sup>LSTM: long short-term memory.</p></fn><fn id="table7fn5"><p><sup>e</sup>RF: random forest.</p></fn><fn id="table7fn6"><p><sup>f</sup>RNN: recurrent neural network.</p></fn><fn id="table7fn7"><p><sup>g</sup>SARIMAX: seasonal autoregressive integrated moving average with exogenous factors.</p></fn><fn id="table7fn8"><p><sup>h</sup>XGB: extreme gradient boosting.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Results Visualization</title><p>We created an interactable dashboard to visualize the predictions made by forecasting models (<xref ref-type="fig" rid="figure4">Figure 4</xref>). The information presented in the user interface includes a time series of actual and predicted values with 95% PI, model performance metrics, and feature importance values for each disease and country or region. In <xref ref-type="fig" rid="figure5">Figure 5</xref>, campylobacteriosis in Schleswig-Holstein, Germany, for the year 2018 using the LGBM model is presented as an example, showing uncertainty quantification by PIs and feature importance as mean SHAP values. The lagging case count feature for the past 6 periods was the most important feature for the model, but variables related to global health spending and monetary export value of cattle also ranked high in feature importance.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Dashboard in prediction view with values based on case counts scaled by population. LGBM: light gradient boosting machine; MAE: mean absolute error; ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e59971_fig04.png"/></fig><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Dashboard with disease (&#x201C;campy&#x201D;=campylobacteriosis) and region (Schleswig-Holstein, Germany) selected in prediction view, which includes model performance statistics in summary and model feature importance list. Pop-out box provides a detailed explanation of the clicked and highlighted feature. LGBM: light gradient boosting machine; MAE: mean absolute error; ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e59971_fig05.png"/></fig></sec><sec id="s3-4"><title>Spatial Generalizability Using Transfer Learning</title><p>The spatial generalizability for the forecasting models was tested based on the performance of the pretrained ensemble model from the location with a comparable disease pattern (ie, similar region) to forecast the disease case counts of the selected region (ie, target region). The model tested (ensemble or best model) varied by location and included statistical (ARIMA: n=3) and tree-based models (LGBM: n=2 and XGB: n=1). In most cases, the MAE of a similar region was close to and often lower than the MAE of the target region (<xref ref-type="table" rid="table8">Table 8</xref>). However, campylobacteriosis forecasting in Kalmar, Sweden, was an exception, where the model MAE increased from 5.01 to 16.98 when V&#x00E4;stmanland feature data were used for training. It is important to note that these are pairwise comparisons of a single metric calculated across a single region and do not include confidence bounds to determine if any differences are statistically significant. However, given that over half of the disease-region models produced an equal or lower MAE when testing in a new region, if a power analysis was conducted assuming a binary outcome and a continued trend, no amount of data would be sufficient to show that the transfer learning results would be significantly worse.</p><table-wrap id="t8" position="float"><label>Table 8.</label><caption><p>The mean absolute error (MAE) values representing spatial generalizability of transfer learning models<sup><xref ref-type="table-fn" rid="table8fn1">a</xref></sup>.</p></caption><table id="table8" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Disease</td><td align="left" valign="top">Country</td><td align="left" valign="top">Target region<break/>(cases in the past 6 months)</td><td align="left" valign="top">Ensemble model</td><td align="left" valign="top">Similar region<break/>(cases in the past 6 months)</td><td align="left" valign="top">MAE of<break/>baseline forecast</td><td align="left" valign="top">MAE of<break/>transfer learning forecast</td></tr></thead><tbody><tr><td align="left" valign="top">Brucellosis</td><td align="left" valign="top">Israel</td><td align="left" valign="top">Jerusalem (34)</td><td align="left" valign="top">LGBM<sup><xref ref-type="table-fn" rid="table8fn2">b</xref></sup></td><td align="left" valign="top">Akko (32)</td><td align="left" valign="top">5.41</td><td align="left" valign="top">2.3</td></tr><tr><td align="left" valign="top">Campylobacteriosis</td><td align="left" valign="top">Sweden</td><td align="left" valign="top">Kalmar (122)</td><td align="left" valign="top">XGB<sup><xref ref-type="table-fn" rid="table8fn3">c</xref></sup></td><td align="left" valign="top">V&#x00E4;stmanland (124)</td><td align="left" valign="top">5.01</td><td align="left" valign="top">16.98</td></tr><tr><td align="left" valign="top">MERS<sup><xref ref-type="table-fn" rid="table8fn4">d</xref></sup></td><td align="left" valign="top">Saudi Arabia</td><td align="left" valign="top">Bisha (0)</td><td align="left" valign="top">ARIMA<sup><xref ref-type="table-fn" rid="table8fn5">e</xref></sup></td><td align="left" valign="top">Eastern Province (0)</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Q fever</td><td align="left" valign="top">Australia</td><td align="left" valign="top">New South Wales (37)</td><td align="left" valign="top">ARIMA</td><td align="left" valign="top">Queensland (48)</td><td align="left" valign="top">2.85</td><td align="left" valign="top">2.00</td></tr><tr><td align="left" valign="top">Tick-borne encephalitis</td><td align="left" valign="top">Germany</td><td align="left" valign="top">Saxony-Anhalt<break/>(3)</td><td align="left" valign="top">ARIMA</td><td align="left" valign="top">Brandenburg (3)</td><td align="left" valign="top">0.20</td><td align="left" valign="top">0.25</td></tr><tr><td align="left" valign="top">Tularemia</td><td align="left" valign="top">Japan</td><td align="left" valign="top">Ibaraki (0)</td><td align="left" valign="top">LGBM</td><td align="left" valign="top">Saga (0)</td><td align="left" valign="top">0.00</td><td align="left" valign="top">0.00</td></tr></tbody></table><table-wrap-foot><fn id="table8fn1"><p><sup>a</sup>For baseline forecasts, the models were trained and tested on target regions. For transfer learning forecasts, the models were trained on similar regions and tested on target regions.</p></fn><fn id="table8fn2"><p><sup>b</sup>LGBM: light gradient boosting machine.</p></fn><fn id="table8fn3"><p><sup>c</sup>XGB: extreme gradient boosting.</p></fn><fn id="table8fn4"><p><sup>d</sup>MERS: Middle East respiratory syndrome.</p></fn><fn id="table8fn5"><p><sup>e</sup>ARIMA: autoregressive integrated moving average.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>As ML and DL techniques gain popularity in the ID forecasting domain, they are being extensively used across a wide range of pathogens with diverse ecology, geographic, and temporal scales. However, there is limited consensus among the forecasting community regarding the application and reporting of these results in a manner that lends themselves useful for operational decision-making in real-world circumstances [<xref ref-type="bibr" rid="ref9">9</xref>]. In this study, we present a universal pipeline for analyzing data, generalizing the results, and automating reporting. We also address crucial operational metrics such as forecasting accuracy, computational efficiency, spatiotemporal generalizability, uncertainty quantification, and interpretability, which are essential in an operational scenario. This generalized and automated analytic pipeline is a major step toward addressing operational demands in the ID forecasting domain and to better inform public health and veterinary policies. We included 6 IDs with diverse transmission dynamics spanning 8 countries and 213 regions. Additionally, we trained our models using a broad range of data from demographic, geographic, climatic, and socioeconomic factors within the One Health landscape. This comprehensive approach enables our analysis to capture the intricate interplay of variables that drive infectious disease presence and transmission, more closely reflecting the complex realities observed in the real world.</p></sec><sec id="s4-2"><title>Model Performance</title><p>We assessed forecasting model accuracies by their ability to detect the presence of a disease based on <italic>F</italic><sub>1</sub>-scores and by their ability to accurately forecast case counts when present using MAE. This 2-step approach prevented the inflation of model accuracy by the regions that did not encounter disease presence during our study period. Though we did not find a single best model suitable for all disease, region, and country combinations, the tree-based models were consistently better than all other models at detecting both disease presence and actual case counts with better <italic>F</italic><sub>1</sub>-scores and MAE values, respectively. Our ensemble technique, which selects the best-performing model for each disease-location pair, demonstrates superior forecasting performance by reducing prediction noise compared to single-model approaches, aligning with previous research [<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. While ideal ensemble methods would dynamically update to identify the best model at each time stamp, this demands extensive data, computational resources, and continuous validation. To address these challenges, we opted for a simpler approach by selecting the best model based on MAE for the testing dataset, minimizing resource and data requirements. However, ensemble techniques still require substantial computational power and analytic pipelines, posing challenges for low- and middle-income countries with limited resources. Investments in infrastructure, skill development, and data-sharing initiatives are crucial to fully leverage ML and DL techniques for ID forecasting in such settings.</p></sec><sec id="s4-3"><title>Computational Efficiency</title><p>The computation time required for ID forecasting can broadly be split into model training and model prediction time. In our analysis, much of the training time was spent on hyperparameter tuning. Autoregressive and tree-based models took less time to tune than DL models. On the other hand, tree-based models (ie, RF and XGB) took considerably longer to produce predictions compared to the other models. This increase in time was mainly because of the time required to compute bootstrap PIs. The LGBM was an exception, as it used the least computational time for both training and testing compared to all the other models. Since our forecasting pipeline performed stepwise forecasting for each month with models retrained only once a year, more time was spent on predicting rather than model training. Hence, when building a forecasting pipeline where the models are retrained once a year and predictions are made every month, it is computationally optimal to choose models with lower prediction time rather than training time.</p><p>The accuracy of modeling techniques can drastically differ with the amount of time and computational resources spent on fine-tuning the model. Here, we chose the initial hyperparameter values for optimization based on their relative importance and time required for overall analysis with the goal of achieving comparable results. It is important to find a balance between model complexity and computational efficiency according to the individual operational needs and available resources.</p></sec><sec id="s4-4"><title>Uncertainty Quantification</title><p>Since the effectiveness of health policies and operational decision-making is driven by the accuracy of forecasts, policy makers need to know the credibility of the models in the form of prediction uncertainties [<xref ref-type="bibr" rid="ref38">38</xref>]. In traditional statistical techniques, such as ARIMA and SARIMAX, forecasting uncertainties are computed based on probability theory and a set of statistical assumptions and, therefore, are readily available. However, generating such PIs is rather complicated in ML and DL compared to traditional methods due to additional uncertainties associated with noise distributions, hyperparameters, overparameterization, and optimization that should be accounted for [<xref ref-type="bibr" rid="ref39">39</xref>]. Therefore, most of the ID forecasting studies fail to report their model uncertainty despite their recent popularity [<xref ref-type="bibr" rid="ref9">9</xref>]. In our study, we used bootstrapping and probabilistic methods to compute PIs around our point estimates of ML and DL methods. Such bounds are crucial to assessing future uncertainties, making operational decisions, planning policies for a range of possible outcomes, and comparing different forecast models thoroughly [<xref ref-type="bibr" rid="ref40">40</xref>]. The LGBM was the best-calibrated model with almost 95% of true observations covered by 95% of PIs, followed by other tree-based and statistical models. The DL models had the least desirable coverage along with their inferior predictive performance and narrow prediction band. This may not be surprising, though as there is evidence in the literature that uncertainty estimates around DL predictions often fail to capture the true data distribution [<xref ref-type="bibr" rid="ref41">41</xref>].</p></sec><sec id="s4-5"><title>Spatiotemporal Generalizability</title><p>Overall, the predictive performance of transfer learning models was comparable to their base models as presented in <xref ref-type="table" rid="table8">Table 8</xref>. For example, using the Akko model to predict case counts of brucellosis in Jerusalem created an increase in predictive accuracy. This suggests the potential for spatial generalizability of our ensemble, that is, an ability to predict existing diseases in new regions with low error. However, campylobacteriosis forecasting in Kalmar, Sweden, was an exception, where the model MAE increased when V&#x00E4;stmanland feature data were used for training. Since campylobacteriosis tends to have higher case counts, the difference in MAE cannot be directly comparable to the other diseases with much lower case counts and naturally lower MAE values. There are many possible reasons for the difference seen in the results. For example, the similar region model may not have contained the necessary similarities to the target region required to enable a lower prediction error, such as differences in regional management practices. The ensemble model (best-performing model for disease-location pair) was different between the test cases and included both statistical (only case counts) and tree-based (many features) models. More advanced transfer learning techniques that include multiple input features to identify similarity and emphasize model retraining by reallocating model weights between target and similar regions could be considered to improve spatial generalizability [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Regardless, these results are encouraging, and a more comprehensive study is warranted.</p></sec><sec id="s4-6"><title>Model Interpretability</title><p>We included interpretability for each model in the form of feature importance, a critical metric that is often neglected in the ID forecasting domain [<xref ref-type="bibr" rid="ref9">9</xref>]. Interpretability provides insight into the decision-making process of the prediction systems, which is crucial for implementing appropriate disease mitigation strategies. Our scoping systematic review of ID prediction models showed that historic case counts are the most commonly used input feature in the ID forecasting domain, while the other important predictors, such as climate, demographics, socioeconomics, and geography, are often neglected [<xref ref-type="bibr" rid="ref9">9</xref>]. In this study, we estimated lower feature ratio and MRR for lag case count features across countries and diseases, indicating that the non&#x2013;case count features were equally important, if not more, compared to case count lags. This study suggests that including data related to the full disease ecology is critical for obtaining accurate, reliable, and interpretable ID forecasts. For example, cattle export was one of the important informative non&#x2013;case count features for forecasting campylobacteriosis in Schleswig-Holstein, Germany. A direct causal association between the disease and cattle exports cannot be made just by a feature importance plot. However, campylobacteriosis is the most commonly reported bacterial food-borne gastrointestinal infection in the European Union that is closely associated with the dairy industry [<xref ref-type="bibr" rid="ref43">43</xref>]. Our results suggest that high dairy and other agriculture activities, including cattle trading in Schleswig-Holstein, could play an important role in the disease prevalence in the region and, if adjusted, could result in disease mitigation.</p></sec><sec id="s4-7"><title>Data Visualization</title><p>To make the best-performing models and corresponding predictions accessible to decision makers, we developed an interactive data visualization dashboard. This dashboard provides the raw data, the model predictions with accompanying 95% PIs and feature importance, overall model performance, and an interactive global map. This dashboard allows a user to visualize forecasts for up to a year into the future in any country or region where the data exist and can be used to inform control measures to reduce the spread of an ID within a country or region.</p></sec><sec id="s4-8"><title>Conclusions</title><p>Our study provides a generalized platform to analyze and report ID forecasts with an emphasis on analytical accuracy, computational efficiency, uncertainty quantification, interpretability, and generalizability. These 5 aspects are crucial in determining the forecasting approach optimal for each situation&#x2019;s operational needs. While all the forecasting techniques come with their own strengths and weaknesses, choosing an optimal approach is usually a tradeoff between computational efficiency, model complexity, and forecasting accuracy. Recognizing and addressing such nuances will facilitate the use of ID forecasts in an operational environment for better preparedness and response during an ID emergency.</p></sec></sec></body><back><ack><p>This work was funded by the Defense Threat Reduction Agency (project CB11029).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are publicly available with website links in the Methods section, including <xref ref-type="table" rid="table1">Table 1</xref>.</p></sec></notes><fn-group><fn fn-type="con"><p>LEC and KTP acquired the funding. RK, KTP, SD, SE, and LEC conceptualized and designed the study. RK, CH, SD, and SE analyzed the data. RK, CH, and KTP created visualizations. RK drafted the manuscript. RK, KTP, CH, and LEC reviewed and edited the manuscript. All authors agreed to the published version of the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ARIMA</term><def><p>autoregressive integrated moving average</p></def></def-item><def-item><term id="abb2">DL</term><def><p>deep learning</p></def></def-item><def-item><term id="abb3">ID</term><def><p>infectious disease</p></def></def-item><def-item><term id="abb4">LASSO</term><def><p>least absolute shrinkage and selection operator</p></def></def-item><def-item><term id="abb5">LGBM</term><def><p>light gradient boosting machine</p></def></def-item><def-item><term id="abb6">LSTM</term><def><p>long short-term memory</p></def></def-item><def-item><term id="abb7">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb8">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb9">MRR</term><def><p>mean reciprocal rank</p></def></def-item><def-item><term id="abb10">PI</term><def><p>prediction interval</p></def></def-item><def-item><term id="abb11">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb12">RNN</term><def><p>recurrent neural network</p></def></def-item><def-item><term id="abb13">SARIMAX</term><def><p>seasonal autoregressive integrated moving average with exogenous factors</p></def></def-item><def-item><term id="abb14">SHAP</term><def><p>Shapley Additive Explanation</p></def></def-item><def-item><term id="abb15">XGB</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bloom</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Buckeridge</surname><given-names>DL</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>KE</given-names> </name></person-group><article-title>Finding leading indicators for disease outbreaks: filtering, cross-correlation, and caveats</article-title><source>J Am Med Inform Assoc</source><year>2007</year><volume>14</volume><issue>1</issue><fpage>76</fpage><lpage>85</lpage><pub-id pub-id-type="doi">10.1197/jamia.M2178</pub-id><pub-id pub-id-type="medline">17068353</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Keshavamurthy</surname><given-names>R</given-names> </name><name name-style="western"><surname>Charles</surname><given-names>LE</given-names> </name></person-group><article-title>Predicting Kyasanur forest disease in resource-limited settings using event-based surveillance and transfer learning</article-title><source>Sci Rep</source><year>2023</year><month>07</month><day>8</day><volume>13</volume><issue>1</issue><fpage>11067</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-38074-0</pub-id><pub-id pub-id-type="medline">37422454</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Woolhouse</surname><given-names>M</given-names> </name></person-group><article-title>How to make predictions about future infectious disease risks</article-title><source>Philos Trans R Soc Lond B Biol Sci</source><year>2011</year><month>07</month><day>12</day><volume>366</volume><issue>1573</issue><fpage>2045</fpage><lpage>2054</lpage><pub-id pub-id-type="doi">10.1098/rstb.2010.0387</pub-id><pub-id pub-id-type="medline">21624924</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bansal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chowell</surname><given-names>G</given-names> </name><name name-style="western"><surname>Simonsen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Vespignani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Viboud</surname><given-names>C</given-names> </name></person-group><article-title>Big data for infectious disease surveillance and modeling</article-title><source>J Infect Dis</source><year>2016</year><month>12</month><day>1</day><volume>214</volume><issue>Suppl 4</issue><fpage>S375</fpage><lpage>S379</lpage><pub-id pub-id-type="doi">10.1093/infdis/jiw400</pub-id><pub-id pub-id-type="medline">28830113</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dixon</surname><given-names>S</given-names> </name><name name-style="western"><surname>Keshavamurthy</surname><given-names>R</given-names> </name><name name-style="western"><surname>Farber</surname><given-names>DH</given-names> </name><name name-style="western"><surname>Stevens</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pazdernik</surname><given-names>KT</given-names> </name><name name-style="western"><surname>Charles</surname><given-names>LE</given-names> </name></person-group><article-title>A comparison of infectious disease forecasting methods across locations, diseases, and time</article-title><source>Pathogens</source><year>2022</year><month>01</month><day>29</day><volume>11</volume><issue>2</issue><fpage>185</fpage><pub-id pub-id-type="doi">10.3390/pathogens11020185</pub-id><pub-id pub-id-type="medline">35215129</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Predicting the spatial-temporal distribution of human brucellosis in Europe based on convolutional long short-term memory network</article-title><source>Can J Infect Dis Med Microbiol</source><year>2022</year><volume>2022</volume><fpage>7658880</fpage><pub-id pub-id-type="doi">10.1155/2022/7658880</pub-id><pub-id pub-id-type="medline">35967090</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Da&#x2019;ar</surname><given-names>OB</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>AE</given-names> </name></person-group><article-title>Underlying trend, seasonality, prediction, forecasting and the contribution of risk factors: an analysis of globally reported cases of Middle East Respiratory Syndrome Coronavirus</article-title><source>Epidemiol Infect</source><year>2018</year><month>08</month><volume>146</volume><issue>11</issue><fpage>1343</fpage><lpage>1349</lpage><pub-id pub-id-type="doi">10.1017/S0950268818001541</pub-id><pub-id pub-id-type="medline">29886854</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adnan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Bai</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Potential early identification of a large Campylobacter outbreak using alternative surveillance data sources: autoregressive modelling and spatiotemporal clustering</article-title><source>JMIR Public Health Surveill</source><year>2020</year><month>09</month><day>17</day><volume>6</volume><issue>3</issue><fpage>e18281</fpage><pub-id pub-id-type="doi">10.2196/18281</pub-id><pub-id pub-id-type="medline">32940617</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Keshavamurthy</surname><given-names>R</given-names> </name><name name-style="western"><surname>Dixon</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pazdernik</surname><given-names>KT</given-names> </name><name name-style="western"><surname>Charles</surname><given-names>LE</given-names> </name></person-group><article-title>Predicting infectious disease for biopreparedness and response: a systematic review of machine learning and deep learning approaches</article-title><source>One Health</source><year>2022</year><month>12</month><volume>15</volume><fpage>100439</fpage><pub-id pub-id-type="doi">10.1016/j.onehlt.2022.100439</pub-id><pub-id pub-id-type="medline">36277100</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chae</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kwon</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>D</given-names> </name></person-group><article-title>Predicting infectious disease using deep learning and big data</article-title><source>Int J Environ Res Public Health</source><year>2018</year><month>07</month><day>27</day><volume>15</volume><issue>8</issue><fpage>1596</fpage><pub-id pub-id-type="doi">10.3390/ijerph15081596</pub-id><pub-id pub-id-type="medline">30060525</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oidtman</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Omodei</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kraemer</surname><given-names>MUG</given-names> </name><etal/></person-group><article-title>Trade-offs between individual and ensemble forecasts of an emerging infectious disease</article-title><source>Nat Commun</source><year>2021</year><month>09</month><day>10</day><volume>12</volume><issue>1</issue><fpage>5379</fpage><pub-id pub-id-type="doi">10.1038/s41467-021-25695-0</pub-id><pub-id pub-id-type="medline">34508077</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reich</surname><given-names>NG</given-names> </name><name name-style="western"><surname>McGowan</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Yamana</surname><given-names>TK</given-names> </name><etal/></person-group><article-title>Accuracy of real-time multi-model ensemble forecasts for seasonal influenza in the U.S</article-title><source>PLOS Comput Biol</source><year>2019</year><month>11</month><volume>15</volume><issue>11</issue><fpage>e1007486</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1007486</pub-id><pub-id pub-id-type="medline">31756193</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ma</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ning</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name></person-group><article-title>Joint COVID-19 and influenza-like illness forecasts in the United States using internet search information</article-title><source>Commun Med (Lond)</source><year>2023</year><month>03</month><day>24</day><volume>3</volume><issue>1</issue><fpage>39</fpage><pub-id pub-id-type="doi">10.1038/s43856-023-00272-2</pub-id><pub-id pub-id-type="medline">36964311</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Jarrah</surname><given-names>OY</given-names> </name><name name-style="western"><surname>Yoo</surname><given-names>PD</given-names> </name><name name-style="western"><surname>Muhaidat</surname><given-names>S</given-names> </name><name name-style="western"><surname>Karagiannidis</surname><given-names>GK</given-names> </name><name name-style="western"><surname>Taha</surname><given-names>K</given-names> </name></person-group><article-title>Efficient machine learning for big data: a review</article-title><source>Big Data Research</source><year>2015</year><month>09</month><volume>2</volume><issue>3</issue><fpage>87</fpage><lpage>93</lpage><pub-id pub-id-type="doi">10.1016/j.bdr.2015.04.001</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Bhatt</surname><given-names>U</given-names> </name><name name-style="western"><surname>Antor&#x00E1;n</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Uncertainty as a form of transparency: measuring, communicating, and using uncertainty</article-title><conf-name>Proceedings of the 2021 AAAI/ACM Conference on AI, Ethics, and Society</conf-name><conf-date>May 19-21, 2021</conf-date><conf-loc>Virtual Event, United States</conf-loc><fpage>401</fpage><lpage>413</lpage><pub-id pub-id-type="doi">10.1145/3461702.3462571</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Generous</surname><given-names>N</given-names> </name><name name-style="western"><surname>Fairchild</surname><given-names>G</given-names> </name><name name-style="western"><surname>Khalsa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Tasseff</surname><given-names>B</given-names> </name><name name-style="western"><surname>Arnold</surname><given-names>J</given-names> </name></person-group><article-title>Epi Archive: automated data collection of notifiable disease data</article-title><source>OJPHI</source><year>2017</year><month>05</month><day>2</day><volume>9</volume><issue>1</issue><pub-id pub-id-type="doi">10.5210/ojphi.v9i1.7615</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Welte</surname><given-names>VR</given-names> </name><name name-style="western"><surname>Vargas Ter&#x00E1;n</surname><given-names>M</given-names> </name></person-group><article-title>Emergency Prevention System (EMPRES) for transboundary animal and plant pests and diseases. The EMPRES-livestock: an FAO initiative</article-title><source>Ann N Y Acad Sci</source><year>2004</year><month>10</month><volume>1026</volume><fpage>19</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.1196/annals.1307.003</pub-id><pub-id pub-id-type="medline">15604466</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><source>GADM</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://gadm.org/">https://gadm.org/</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><source>GES DISC</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://disc.gsfc.nasa.gov/">https://disc.gsfc.nasa.gov/</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><article-title>Earth Science Data Systems</article-title><source>NASA</source><year>2024</year><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.earthdata.nasa.gov/">https://www.earthdata.nasa.gov/</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><source>US Department of Agriculture. Economic Research Service&#x2014;Home</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ers.usda.gov/">https://www.ers.usda.gov/</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="web"><source>DIVA-GIS | free, simple &#x0026; effective</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://diva-gis.org/">https://diva-gis.org/</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="web"><article-title>World Health Organization (WHO)</article-title><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int">https://www.who.int</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><article-title>OECD Statistics</article-title><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://stats.oecd.org/">https://stats.oecd.org/</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="web"><source>Natural Earth. Free vector and raster map data at 1:10m, 1:50m, and 1:110m scales</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.naturalearthdata.com/">https://www.naturalearthdata.com/</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><article-title>Population division</article-title><source>United Nations</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.un.org/development/desa/pd/">https://www.un.org/development/desa/pd/</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><article-title>SEDAC: Socioeconomic Data and Applications Center</article-title><source>NASA</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://sedac.ciesin.columbia.edu/">https://sedac.ciesin.columbia.edu/</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Josef</surname><given-names>P</given-names> </name><name name-style="western"><surname>Skipper</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kevin</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Statsmodels: econometric and statistical modeling with python</article-title><year>2010</year><access-date>2025-02-28</access-date><conf-name>Proceedings of the 9th Python in Science Conference</conf-name><conf-loc>Texas, US</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://www.statsmodels.org/">https://www.statsmodels.org/</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><source>scikit-learn: machine learning in Python</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/stable/">https://scikit-learn.org/stable/</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taylor</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Letham</surname><given-names>B</given-names> </name></person-group><article-title>Forecasting at scale</article-title><source>PeerJ Preprints</source><year>2017</year><month>09</month><volume>5</volume><fpage>e3190v2</fpage><pub-id pub-id-type="doi">10.7287/peerj.preprints.3190</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>Darts: time series made easy in Python</article-title><source>Unit8</source><access-date>2024-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://unit8.com/resources/darts-time-series-made-easy-in-python/">https://unit8.com/resources/darts-time-series-made-easy-in-python/</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Amat Rodrigo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Escobar Ortiz</surname><given-names>J</given-names> </name></person-group><article-title>Skforecast</article-title><source>Zenodo</source><year>2024</year><access-date>2025-02-28</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://zenodo.org/records/8382788">https://zenodo.org/records/8382788</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Vaswani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shazeer</surname><given-names>N</given-names> </name><name name-style="western"><surname>Parmar</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Attention is all you need</article-title><conf-name>Advances in Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>California, United States</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2017/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html">https://proceedings.neurips.cc/paper_files/paper/2017/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="web"><article-title>Topical overviews</article-title><source>SHAP Latest Documentation</source><access-date>2024-03-02</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://shap.readthedocs.io/en/latest/overviews.html">https://shap.readthedocs.io/en/latest/overviews.html</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alfred</surname><given-names>R</given-names> </name><name name-style="western"><surname>Obit</surname><given-names>JH</given-names> </name></person-group><article-title>The roles of machine learning methods in limiting the spread of deadly diseases: a systematic review</article-title><source>Heliyon</source><year>2021</year><month>06</month><volume>7</volume><issue>6</issue><fpage>e07371</fpage><pub-id pub-id-type="doi">10.1016/j.heliyon.2021.e07371</pub-id><pub-id pub-id-type="medline">34179541</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khan</surname><given-names>SD</given-names> </name><name name-style="western"><surname>Alarabi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Basalamah</surname><given-names>S</given-names> </name></person-group><article-title>Toward smart lockdown: a novel approach for COVID-19 hotspots prediction using a deep hybrid neural network</article-title><source>Computers</source><year>2020</year><volume>9</volume><issue>4</issue><fpage>99</fpage><pub-id pub-id-type="doi">10.3390/computers9040099</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kasilingam</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sathiya Prabhakaran</surname><given-names>SP</given-names> </name><name name-style="western"><surname>Rajendran</surname><given-names>DK</given-names> </name><name name-style="western"><surname>Rajagopal</surname><given-names>V</given-names> </name><name name-style="western"><surname>Santhosh Kumar</surname><given-names>T</given-names> </name><name name-style="western"><surname>Soundararaj</surname><given-names>A</given-names> </name></person-group><article-title>Exploring the growth of COVID-19 cases using exponential modelling across 42 countries and predicting signs of early containment using machine learning</article-title><source>Transbound Emerg Dis</source><year>2021</year><month>05</month><volume>68</volume><issue>3</issue><fpage>1001</fpage><lpage>1018</lpage><pub-id pub-id-type="doi">10.1111/tbed.13764</pub-id><pub-id pub-id-type="medline">32749759</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gilbert</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Meyers</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Galvani</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Townsend</surname><given-names>JP</given-names> </name></person-group><article-title>Probabilistic uncertainty analysis of epidemiological modeling to guide public health intervention policy</article-title><source>Epidemics</source><year>2014</year><month>03</month><volume>6</volume><fpage>37</fpage><lpage>45</lpage><pub-id pub-id-type="doi">10.1016/j.epidem.2013.11.002</pub-id><pub-id pub-id-type="medline">24593920</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Psaros</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Karniadakis</surname><given-names>GE</given-names> </name></person-group><article-title>Uncertainty quantification in scientific machine learning: methods, metrics, and comparisons</article-title><source>J Comput Phys</source><year>2023</year><month>03</month><volume>477</volume><fpage>111902</fpage><pub-id pub-id-type="doi">10.1016/j.jcp.2022.111902</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Chatfield</surname><given-names>C</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Armstrong</surname><given-names>JS</given-names> </name></person-group><article-title>Prediction intervals for time-series forecasting</article-title><source>Principles of Forecasting: A Handbook for Researchers and Practitioners</source><year>2001</year><publisher-name>Springer</publisher-name><fpage>475</fpage><lpage>494</lpage><pub-id pub-id-type="doi">10.1007/978-0-306-47630-3_21ISBN:978-0-306-47630-3</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lakshminarayanan</surname><given-names>B</given-names> </name><name name-style="western"><surname>Pritzel</surname><given-names>A</given-names> </name><name name-style="western"><surname>Blundell</surname><given-names>C</given-names> </name></person-group><article-title>Simple and scalable predictive uncertainty estimation using deep ensembles</article-title><access-date>2025-02-28</access-date><conf-name>Advances in Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>California, United States</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2017/hash/9ef2ed4b7fd2c810847ffa5fa85bce38-Abstract.html">https://proceedings.neurips.cc/paper_files/paper/2017/hash/9ef2ed4b7fd2c810847ffa5fa85bce38-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roster</surname><given-names>K</given-names> </name><name name-style="western"><surname>Connaughton</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rodrigues</surname><given-names>FA</given-names> </name></person-group><article-title>Forecasting new diseases in low-data settings using transfer learning</article-title><source>Chaos Solitons Fractals</source><year>2022</year><month>08</month><volume>161</volume><fpage>112306</fpage><pub-id pub-id-type="doi">10.1016/j.chaos.2022.112306</pub-id><pub-id pub-id-type="medline">35765601</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Henningsen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Henning</surname><given-names>C</given-names> </name><name name-style="western"><surname>Struve</surname><given-names>C</given-names> </name><name name-style="western"><surname>Mueller-Scheessel</surname><given-names>J</given-names> </name></person-group><article-title>Economic impact of the mid-term review on agricultural production, farm income and farm survival: a quantitative analysis for local sub-regions of Schleswig-Holstein in Germany</article-title><conf-name>2005 International Congress</conf-name><conf-date>Aug 23-27, 2005</conf-date><conf-loc>Copenhagen, Denmark</conf-loc><pub-id pub-id-type="doi">10.22004/ag.econ.24644</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Supplementary figures and tables.</p><media xlink:href="publichealth_v11i1e59971_app1.docx" xlink:title="DOCX File, 395 KB"/></supplementary-material></app-group></back></article>