<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id><journal-id journal-id-type="publisher-id">publichealth</journal-id><journal-id journal-id-type="index">9</journal-id><journal-title>JMIR Public Health and Surveillance</journal-title><abbrev-journal-title>JMIR Public Health Surveill</abbrev-journal-title><issn pub-type="epub">2369-2960</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e86495</article-id><article-id pub-id-type="doi">10.2196/86495</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predicting Tuberculosis Outcomes Using Routine Surveillance Data in Chiang Mai, Thailand: Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Saksaen</surname><given-names>Porramat</given-names></name><degrees>MNS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Boonchieng</surname><given-names>Ekkarat</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Thongprachum</surname><given-names>Aksara</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Maotheuak</surname><given-names>Surasak</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chautrakarn</surname><given-names>Sineenart</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Boonchieng</surname><given-names>Waraporn</given-names></name><degrees>DrPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Faculty of Public Health, Chiang Mai University</institution><addr-line>239 Huay Kaew Road, Muang District</addr-line><addr-line>Chiang Mai</addr-line><country>Thailand</country></aff><aff id="aff2"><institution>Faculty of Science, Department of Computer Science, Chiang Mai University</institution><addr-line>Chiang Mai</addr-line><country>Thailand</country></aff><aff id="aff3"><institution>Faculty of Education, Department of Curriculum, Teaching &#x0026; Learning, Chiang Mai University</institution><addr-line>Chiang Mai</addr-line><country>Thailand</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Sanchez</surname><given-names>Travis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Girma</surname><given-names>Abayeneh</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Owusu</surname><given-names>Benjamin Atta</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Lau</surname><given-names>Eric</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Celik</surname><given-names>Ilhami</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Waraporn Boonchieng, DrPH, Faculty of Public Health, Chiang Mai University, 239 Huay Kaew Road, Muang District, Chiang Mai, 50200, Thailand, 66 53 942525; <email>waraporn.b@cmu.ac.th</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>25</day><month>6</month><year>2026</year></pub-date><volume>12</volume><elocation-id>e86495</elocation-id><history><date date-type="received"><day>25</day><month>10</month><year>2025</year></date><date date-type="rev-recd"><day>03</day><month>05</month><year>2026</year></date><date date-type="accepted"><day>30</day><month>05</month><year>2026</year></date></history><copyright-statement>&#x00A9; Porramat Saksaen, Ekkarat Boonchieng, Aksara Thongprachum, Surasak Maotheuak, Sineenart Chautrakarn, Waraporn Boonchieng. Originally published in JMIR Public Health and Surveillance (<ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>), 25.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://publichealth.jmir.org/2026/1/e86495"/><abstract><sec><title>Background</title><p>Tuberculosis (TB) remains one of the leading causes of death from a single infectious disease worldwide. In Thailand, persistent gaps in early detection and access to TB care remain important public health challenges, particularly among populations in rural and remote areas.</p></sec><sec><title>Objective</title><p>This study aimed to develop and evaluate predictive models for TB outcomes using routine surveillance data to support risk stratification, thereby informing public health decision-making in Chiang Mai Province, Thailand.</p></sec><sec sec-type="methods"><title>Methods</title><p>A retrospective cohort study was conducted using data from 5557 TB cases registered in the National Tuberculosis Information Program in Chiang Mai Province from 2020 to 2024. Models were developed to predict treatment success, mortality, and time to treatment initiation. We evaluated model performance using the area under the receiver operating characteristic curve, the Harrell Concordance Index, and error-based metrics for time-to-treatment prediction. Scenario analyses were conducted under predefined assumptions to assess projected changes in detection-related indicators, treatment coverage, and mortality relative to provincial baseline indicators.</p></sec><sec sec-type="results"><title>Results</title><p>The models demonstrated good predictive performance. Mortality was associated with HIV co-infection (hazard ratio 5.80) and was highest among older adults with HIV co-infection (hazard ratio 12.30). Treatment delays were longer among individuals living in rural or remote areas and among those without health insurance, with mean delays ranging from 8 to 18 days. These findings suggest distinct patterns in TB outcomes, with mortality more closely related to clinical vulnerability and treatment delay more closely related to health care access factors. Under modeled scenarios, the models projected that detection-related indicators would increase by 25%, treatment coverage would increase by 15%, and mortality would decrease by 20% relative to provincial baseline conditions.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Predictive modeling using routine TB surveillance data may support risk stratification and provide insights into treatment outcomes and delays. The findings highlight the combined roles of clinical vulnerability and health care access factors in TB outcomes and support further evaluation of data-driven approaches to inform targeted TB interventions in resource-limited settings.</p></sec></abstract><kwd-group><kwd>tuberculosis</kwd><kwd>predictive modeling</kwd><kwd>treatment delay</kwd><kwd>mortality</kwd><kwd>health equity</kwd><kwd>resource-limited settings</kwd><kwd>sustainable development goals</kwd><kwd>SDG</kwd><kwd>SDG 3</kwd><kwd>SDG 10</kwd><kwd>Thailand</kwd><kwd>good health and well-being</kwd><kwd>reduced inequalities</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Tuberculosis (TB) remains one of the leading causes of death from a single infectious disease worldwide. The World Health Organization (WHO) estimates that 10.7 million people developed TB globally in 2024, of whom 8.3 million were diagnosed and notified, highlighting persistent gaps in case detection and reporting. Although global health efforts have made progress in TB diagnosis and treatment, global TB incidence declined by approximately 12% between 2015 and 2024, remaining well below the End TB Strategy target of a 50% reduction by 2025 [<xref ref-type="bibr" rid="ref1">1</xref>].</p><p>Thailand is classified as a high-burden country for TB and TB/HIV by the WHO. Thailand has an estimated 113,000 new TB cases annually, corresponding to an incidence of 157 per 100,000 population. Of these, HIV co-infection accounts for 9,400 cases, and 13,000 deaths are attributed to TB each year [<xref ref-type="bibr" rid="ref2">2</xref>]. Reported treatment coverage is approximately 71%, indicating persistent gaps in access to diagnosis and care. Previous studies have shown that TB does not distribute evenly across Thailand but rather clusters in several areas, particularly along international border regions [<xref ref-type="bibr" rid="ref3">3</xref>]. These geographic and health-system disparities highlight the need for analytical approaches that integrate epidemiological, clinical, and health service data to support more precise and equitable TB control.</p><p>Mathematical models, particularly compartmental models such as the SEIR (susceptible-exposed-infectious-recovered) framework, have been widely used to study TB epidemiology. Unlike the classical SIR model, the SEIR framework explicitly includes an exposed compartment representing individuals who are infected but not yet infectious, thereby accounting for the latent stage before progression to active TB disease [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. However, classical SEIR-based approaches often rely on simplifying assumptions, such as homogeneous mixing and fixed transition rates between compartments. These approaches may have limited ability to capture individual-level heterogeneity in clinical risk, health care access, and treatment outcomes.</p><p>Researchers are increasingly applying machine learning (ML) methods to TB-related predictive tasks, such as incidence prediction, diagnosis, and treatment outcome prediction [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. These approaches can exploit high-dimensional, heterogeneous data and demonstrate strong predictive performance for specific TB-related outcomes. ML-based approaches have also been incorporated into clinical decision support systems to assist with diagnostic and treatment decision-making [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. However, most existing studies focus on isolated prediction tasks and do not explicitly link individual-level risk estimation with broader epidemiological disease-stage structures.</p><p>The strengths of SEIR-based epidemiological models and ML approaches are complementary. SEIR-based frameworks [<xref ref-type="bibr" rid="ref10">10</xref>] provide a structured way to conceptualize disease progression at the population level, whereas ML approaches enable data-driven prediction of observable individual-level outcomes from clinical and surveillance data. However, there remains limited evidence on how routine TB surveillance data can be organized within an epidemiologically informed framework to generate practical predictions of treatment outcomes, mortality, and treatment delays. This gap is particularly important in settings where surveillance systems contain rich programmatic data, but practitioners do not routinely use them for risk stratification or decision support.</p><p>TB control in Thailand is primarily implemented through health care facility&#x2013;based diagnosis, registration, and treatment reporting. In contrast, routine programmatic reporting remains centered on surveillance and treatment monitoring rather than risk-prediction tools. Ongoing programmatic work includes surveillance and focused interventions for key high-risk or vulnerable populations, such as people living with HIV, prisoners, migrants, older adults, and non-Thai populations [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Thailand has established the National Tuberculosis Information Program (NTIP) as a national online TB reporting system. However, there are gaps in translating surveillance data into analytical tools that can support decision-making at different levels of the health care system.</p><p>NTIP is Thailand&#x2019;s national TB reporting system that collects data on diagnoses, treatment registrations, and outcomes from health care facilities [<xref ref-type="bibr" rid="ref13">13</xref>]. While NTIP provides a standardized national dataset, it reflects diagnosed and registered TB cases and does not capture unobserved infection or transmission processes. These characteristics make NTIP suitable for developing predictive models focused on routinely observed clinical and programmatic outcomes. Integration of NTIP data with analytical models that combine an epidemiologically informed structure and predictive modeling may support more systematic use of surveillance data for risk stratification and policy planning.</p><p>Therefore, this study aimed to develop and evaluate a TB surveillance framework based on an SEIR-informed conceptual structure and predictive models using NTIP data from Chiang Mai Province. Specifically, the study aimed to assess whether routinely collected surveillance data could support risk prediction, risk stratification, and public health decision-making for TB outcomes in a resource-limited setting.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>This retrospective cohort study used routine surveillance data to develop a TB surveillance framework that combines an SEIR-informed conceptual structure with individual-level predictive models. We used the SEIR framework [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] to guide the conceptual organization of TB disease stages. Empirical modeling focused on clinical and programmatic outcomes recorded in NTIP, including treatment success, mortality, and time to treatment initiation.</p><p>Within this framework, NTIP provided data on diagnosed and registered TB cases, treatment outcomes, deaths, and treatment initiation dates. Registered TB cases represented the observed infectious state among patients captured by the surveillance system. We operationalized recovery-related outcomes as treatment success, and we used recorded deaths to represent mortality. NTIP did not directly capture susceptible and exposed populations; therefore, we retained them as conceptual components of the SEIR-informed framework. <xref ref-type="table" rid="table1">Table 1</xref> summarizes the observability and operationalization of SEIR-D (susceptible-exposed-infectious-recovered-death) components in NTIP data.</p><p>The study, therefore, linked an epidemiologically informed disease-stage framework with predictive modeling of observed outcomes among patients diagnosed with and registered for TB.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Summarizes the observability and operationalization of SEIR-D (susceptible-exposed-infectious-recovered-death) components in the National Tuberculosis Information Program (NTIP) data<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Component</td><td align="left" valign="bottom">Epidemiological meaning</td><td align="left" valign="bottom">NTIP observability</td><td align="left" valign="bottom">Operationalization in this study</td></tr></thead><tbody><tr><td align="left" valign="top">Susceptible</td><td align="left" valign="top">Population at risk of TB<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> infection</td><td align="left" valign="top">Not directly observed</td><td align="left" valign="top">Conceptual component of the SEIR-informed framework</td></tr><tr><td align="left" valign="top">Exposed</td><td align="left" valign="top">Individuals with TB infection before registered active TB disease</td><td align="left" valign="top">Not directly observed</td><td align="left" valign="top">Conceptual component of the SEIR-informed framework</td></tr><tr><td align="left" valign="top">Infectious</td><td align="left" valign="top">Diagnosed active TB cases</td><td align="left" valign="top">Observed among registered cases</td><td align="left" valign="top">Registered TB cases recorded in NTIP</td></tr><tr><td align="left" valign="top">Recovered</td><td align="left" valign="top">Successful treatment outcome</td><td align="left" valign="top">Observed</td><td align="left" valign="top">Treatment success recorded in NTIP</td></tr><tr><td align="left" valign="top">Death</td><td align="left" valign="top">Death during treatment or follow-up</td><td align="left" valign="top">Observed</td><td align="left" valign="top">Death recorded in NTIP treatment outcome data</td></tr><tr><td align="left" valign="top">Treatment delay</td><td align="left" valign="top">Interval from diagnosis to treatment initiation</td><td align="left" valign="top">Observed</td><td align="left" valign="top">Days between diagnosis and treatment initiation</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>SEIR-D components were defined within an SEIR-informed conceptual framework and operationalized according to the structure of the NTIP surveillance dataset. Susceptible and exposed populations were not directly observed in NTIP and were retained as conceptual components. Empirical analyses focused on registered TB cases, treatment success, death, and time to treatment initiation. Treatment delay was considered a programmatic interval rather than a disease-state compartment.</p></fn><fn id="table1fn2"><p><sup>b</sup>TB: tuberculosis.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Study Area and Data Sources</title><p>Data were obtained from the NTIP, including records of patients with TB registered in Chiang Mai Province between October 2020 and September 2024. The NTIP database provided individual-level data on diagnosis, treatment registration, comorbidities, and treatment outcomes.</p></sec><sec id="s2-3"><title>Inclusion and Exclusion Criteria</title><p>The study population consisted of patients registered for TB treatment in NTIP during the study period. We excluded patients with missing values for key variables required for model development, including age, sex, district of residence, treatment initiation date, or treatment outcome. These variables were required to define the analytical cohort, predictor structure, and primary outcomes. The analytical dataset comprised 5557 cases after data cleaning and eligibility screening based on variable completeness. Records were excluded only when missingness involved variables essential for defining the analytical cohort, primary outcomes, or model structure; we addressed missing values in nonessential variables separately using multiple imputation.</p></sec><sec id="s2-4"><title>Data Management and Preparation</title><p>The key variables in the analytical dataset were age, sex, district of residence, date of treatment initiation, and treatment outcome. Records with missing values in key analytical variables were excluded. Missing values were imputed for nonessential variables, such as selected comorbidities and health care system indicators, using multiple imputation by chained equations, which generated 20 imputed datasets to account for the uncertainty of the imputed values and to reduce potential bias associated with complete-case analysis [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. The imputation model included observed demographic, clinical, and health system variables and assumed a missing-at-random mechanism conditional on these observed variables. This approach is consistent with established recommendations for handling incomplete observational data when missingness is assumed to be conditional on observed variables [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>BMI, comorbidities, HIV status, insurance status, and other predictor variables were recorded at TB registration or initial clinical assessment and used as baseline predictors for subsequent recorded outcomes. A BMI of less than 18.5 kg/m<sup>2</sup> was defined using the BMI value recorded at registration or initial assessment. We used the Tukey fences and the isolation forest algorithm [<xref ref-type="bibr" rid="ref17">17</xref>] to identify outliers. We set the contamination parameter of the isolation forest algorithm to 0.05, and we checked model outputs for clinical plausibility. Residence categories were defined using geographic accessibility to TB services, including the distance from residence to treatment facilities. Urban residence, representing the most accessible category, was used as the reference group for residence variables. All eligible records were retained for model development and assessed using train-test splitting and internal cross-validation.</p></sec><sec id="s2-5"><title>Development of Predictive Models</title><p>We conducted predictive modeling using observable outcomes from the final analytic NTIP dataset of 5557 TB cases. We selected models according to the structure of the recorded outcomes and the statistical requirements of each prediction task. We applied logistic regression for binary treatment success [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], the Cox proportional hazards model for time-to-event mortality with censoring [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>], and the log-normal accelerated failure time model for time to treatment initiation [<xref ref-type="bibr" rid="ref20">20</xref>]. This approach allowed each model to correspond to the scale, timing, and censoring structure of each outcome under analysis. Because NTIP records diagnosed and registered TB cases rather than the full susceptible or exposed population, model construction focused on clinical and programmatic outcomes available among registered patients. The SEIR framework was used to organize disease-stage concepts, consistent with compartmental modeling approaches that distinguish susceptible, exposed, infectious, and recovered states [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p><p>A multivariable logistic regression model was used to predict treatment success as a binary outcome, selected for its interpretability and suitability for clinical decision-making [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. A Cox proportional hazards model [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>] was used to estimate the hazard of death with time-to-event data, accounting for censoring. We tested the proportional hazards assumption using Schoenfeld residuals. We fitted an accelerated failure time model with a log-normal distribution to estimate delays between diagnosis and treatment initiation; this approach estimates the effect of covariates on event time rather than on the hazard function [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>Together, these models estimated binary outcomes, time-to-event risks, and delays within a unified analytical framework based on recorded clinical and programmatic end points, including treatment success, mortality, and diagnosis-to-treatment delay. We specified the predictive models for recorded outcomes rather than for latent or unobserved transmission states. Model performance was assessed using discrimination and calibration metrics, including the area under the receiver operating characteristic curve (AUC) for classification models [<xref ref-type="bibr" rid="ref22">22</xref>] and concordance-based measures for survival models [<xref ref-type="bibr" rid="ref23">23</xref>].</p></sec><sec id="s2-6"><title>Model Training and Validation</title><p>We assessed model performance using a train-test split (train: 4446/5557, 80%; test: 1111/5557, 20%) and performed internal validation using 10-fold stratified cross-validation on the training set. For classification models, the AUC was used as a performance metric [<xref ref-type="bibr" rid="ref22">22</xref>]. For survival models, the Harrell Concordance Index was used as a performance metric [<xref ref-type="bibr" rid="ref23">23</xref>]. We assessed prediction error for the time-to-treatment model using root mean squared error and mean absolute error. Additionally, we assessed the goodness-of-fit of the logistic regression model using the Hosmer-Lemeshow test [<xref ref-type="bibr" rid="ref17">17</xref>]. We assessed discrimination, calibration, and prediction error across outcome types and model specifications.</p></sec><sec id="s2-7"><title>Management of Conflicting Outcomes</title><p>We analyzed mortality and treatment success as separate outcome-specific end points. We modeled mortality using time-to-event methods, whereas we modeled treatment success as a binary outcome. We applied this outcome-specific modeling strategy to support risk stratification across different stages of the TB care pathway. We interpreted estimates as predictive associations rather than causal effects.</p></sec><sec id="s2-8"><title>Analysis of Scenarios</title><p>We performed scenario analyses to assess projected changes in detection-related indicators, treatment coverage, and mortality under predefined modeled assumptions. The baseline scenario represented the observed provincial TB program conditions prior to applying the modeled changes. Baseline values included the provincial detection-related indicator, treatment coverage, and mortality rate, which were derived from Chiang Mai provincial TB program indicators. We derived the time to treatment initiation from recorded diagnosis and treatment initiation dates in NTIP and modeled it separately using a log-normal accelerated failure time model.</p><p>We represented screening as a programmatic process related to case detection rather than as a disease-state compartment. We specified detection-related changes as proportional changes relative to provincial TB program baseline indicators. We represented changes in treatment processes using predefined relative changes in treatment coverage and mortality, which were applied to provincial baseline indicators.</p><p>In the baseline scenario, the detection-related indicator was 87.08%, treatment coverage was 71.90%, and mortality was 11.90% [<xref ref-type="bibr" rid="ref12">12</xref>]. The scenario parameters for detection-related improvement, treatment coverage improvement, and mortality reduction were predefined assumptions rather than estimates from an observed intervention. We, therefore, interpreted scenario outcomes as model-based projections rather than observed intervention effects, consistent with the use of modeling approaches to inform public health decision-making in the absence of direct population-level evidence [<xref ref-type="bibr" rid="ref24">24</xref>].</p></sec><sec id="s2-9"><title>Statistical Analysis and Software</title><p>We conducted all analyses using R (version 4.1.2; R Foundation for Statistical Computing) and Python (version 3.11; Python Software Foundation). We defined statistical significance as <italic>P</italic>&#x003C;.05, and we reported all estimates with 95% CI. As NTIP represents a registry of reported TB cases rather than a sampled survey dataset, we therefore did not apply survey weighting. Given the analysis&#x2019;s predictive and exploratory focus, we instead emphasized effect estimates, CI, and model performance metrics rather than confirmatory hypothesis testing.</p></sec><sec id="s2-10"><title>Ethical Considerations</title><p>The research ethics committee of the Faculty of Public Health, Chiang Mai University (approval: ET030/2025) and the Chiang Mai Provincial Public Health Office approved the study protocol. We anonymized all data prior to analysis and retained no identifiable personal information. Data were stored in secure, encrypted systems in accordance with applicable data protection regulations.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Demographic, Clinical, and Health Care Access Characteristics of the Study Participants</title><p>This study analyzed 5557 TB cases recorded in the NTIP in Chiang Mai Province between 2020 and 2024. Most participants were male (3756, 67.6% cases), and the mean age was 45.3 (SD 14.8) years. HIV co-infection was present in 556 (10.0% cases), 1000 (18.0%) cases had diabetes mellitus, and 1223 (22.0%) cases had a BMI &#x003C;18.5 kg/m<sup>2</sup>. Health care access characteristics included absence of health insurance in 445 (8.0%) cases, rural residence in 1556 (28.0%) cases, and remote residence in 445 (8.0%) cases (<xref ref-type="table" rid="table2">Table 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Baseline demographic, clinical, and health care access characteristics of the study population (N=5557)<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristic</td><td align="left" valign="bottom">Values</td></tr></thead><tbody><tr><td align="left" valign="top">Male sex, n (%)</td><td align="left" valign="top">3756 (67.6)</td></tr><tr><td align="left" valign="top">Age (y), mean (SD)</td><td align="left" valign="top">45.3 (14.8)</td></tr><tr><td align="left" valign="top">HIV-positive, n (%)</td><td align="left" valign="top">556 (10.0)</td></tr><tr><td align="left" valign="top">Diabetes mellitus, n (%)</td><td align="left" valign="top">1000 (18.0)</td></tr><tr><td align="left" valign="top">BMI (&#x003C;18.5 kg/m<sup>2</sup>), n (%)</td><td align="left" valign="top">1223 (22.0)</td></tr><tr><td align="left" valign="top">No health insurance, n (%)</td><td align="left" valign="top">445 (8.0)</td></tr><tr><td align="left" valign="top">Rural residence, n (%)</td><td align="left" valign="top">1556 (28.0)</td></tr><tr><td align="left" valign="top">Remote residence, n (%)</td><td align="left" valign="top">445 (8.0)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Baseline demographic, clinical, and health care access characteristics of National Tuberculosis Information Program&#x2013;registered patients with tuberculosis in Chiang Mai Province, Thailand, 2020&#x2010;2024. Data are presented as n (%) or mean (SD).</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Predictive Model Performance</title><p>Predictive models demonstrated good performance across recorded TB outcomes. The AUC for the treatment success model was 0.88 (95% CI 0.86&#x2010;0.90), indicating good discrimination. The mortality model showed the Harrell Concordance Index of 0.86 (95% CI 0.84&#x2010;0.88), indicating good concordance between predicted and observed survival outcomes. We summarized prediction error for time to treatment initiation using root mean squared error and mean absolute error, with values of 8.2 days and 5.7 days, respectively. The logistic regression model was adequately calibrated, with no evidence of poor fit based on the Hosmer-Lemeshow test (<italic>P</italic>&#x003E;.05; <xref ref-type="table" rid="table3">Table 3</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance of predictive models for tuberculosis outcomes<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Outcome</td><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Performance metric</td></tr></thead><tbody><tr><td align="left" valign="top">Treatment success</td><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">AUC<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>=0.88 (95% CI 0.86&#x2010;0.90)</td></tr><tr><td align="left" valign="top">Mortality</td><td align="left" valign="top">Cox proportional hazards model</td><td align="left" valign="top">Harrell Concordance Index=0.86 (95% CI 0.84&#x2010;0.88)</td></tr><tr><td align="left" valign="top">Time to treatment initiation</td><td align="left" valign="top">Log-normal AFT<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> model</td><td align="left" valign="top">RMSE<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup>=8.2 days; MAE<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup>=5.7 days<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Performance metrics of predictive models for tuberculosis outcomes in a retrospective cohort of National Tuberculosis Information Program&#x2013;registered patients in Chiang Mai Province, Thailand, 2020&#x2010;2024. </p></fn><fn id="table3fn2"><p><sup>b</sup>AUC: area under the receiver operating characteristic curve.</p></fn><fn id="table3fn3"><p><sup>c</sup>AFT: accelerated failure time.</p></fn><fn id="table3fn4"><p><sup>d</sup>RMSE: root mean squared error.</p></fn><fn id="table3fn5"><p><sup>e</sup>MAE: mean absolute error.</p></fn><fn id="table3fn6"><p><sup>f</sup>RMSE and MAE represent prediction errors for the time to treatment initiation, expressed in days.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Treatment Success as a Recovery-Related Outcome</title><p>We modeled treatment success as the recovery-related outcome recorded in NTIP. The logistic regression model for treatment success demonstrated good discrimination, with an AUC of 0.88 (95% CI 0.86&#x2010;0.90), indicating that routinely recorded clinical and programmatic variables are informative for classifying treatment success among registered patients with TB.</p></sec><sec id="s3-4"><title>Factors Associated With Mortality</title><p>HIV infection was associated with higher mortality among patients with TB (HR 5.80; 95% CI 4.20&#x2010;7.90; <italic>P</italic>&#x003C;.001). Patients aged older than 65 years with HIV co-infection had the highest estimated mortality risk (HR 12.30; 95% CI 8.90&#x2010;16.40; <italic>P</italic>&#x003C;.001). Higher mortality was also associated with diabetes mellitus (HR 3.10; 95% CI 2.30&#x2010;4.40; <italic>P</italic>&#x003C;.001) and a BMI of less than 18.5 kg/m<sup>2</sup> (HR 2.30; 95% CI 1.70&#x2010;3.10; <italic>P</italic>&#x003C;.001; <xref ref-type="table" rid="table4">Table 4</xref>). We present these estimates as outcome-specific associations from the mortality model.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Factors associated with mortality<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Factor</td><td align="left" valign="bottom" colspan="2">HR<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (95% CI)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">HIV-positive</td><td align="left" valign="top" colspan="2">5.80 (4.20&#x2010;7.90)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Age (&#x003E;65 y with HIV co-infection)</td><td align="left" valign="top" colspan="2">12.30 (8.90&#x2010;16.40)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Diabetes mellitus</td><td align="left" valign="top" colspan="2">3.10 (2.30&#x2010;4.40)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">BMI (&#x003C;18.5 kg/m<sup>2</sup>)</td><td align="left" valign="top" colspan="2">2.30 (1.70&#x2010;3.10)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>Factors associated with mortality among patients with tuberculosis in Chiang Mai Province, Thailand, from 2020 to 2024. Hazard ratios were estimated using Cox proportional hazards models.</p></fn><fn id="table4fn2"><p><sup>b</sup>HR: hazard ratio.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Factors Associated With Treatment Delay</title><p>Treatment delays were longer among individuals living in rural and remote areas than among those living in urban areas. Rural residence was associated with an average delay of 12 (95% CI 9&#x2010;15) days, remote residence with 18 (95% CI 14&#x2010;22) days, lack of health insurance with 8 (95% CI 6&#x2010;10) days, and age &#x003E;70 years with 6 (95% CI 4&#x2010;9) days (<xref ref-type="table" rid="table5">Table 5</xref>). We present treatment-delay estimates as mean differences with 95% CI.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Factors associated with treatment delays<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup>.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Factor</td><td align="left" valign="bottom" colspan="2">Days, mean difference (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">Rural residence</td><td align="left" valign="top" colspan="2">12 (9&#x2010;15)</td></tr><tr><td align="left" valign="top">Remote residence</td><td align="left" valign="top" colspan="2">18 (14&#x2010;22)</td></tr><tr><td align="left" valign="top">No health insurance</td><td align="left" valign="top" colspan="2">8 (6&#x2010;10)</td></tr><tr><td align="left" valign="top">Age (&#x003E;70 y)</td><td align="left" valign="top" colspan="2">6 (4&#x2010;9)</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>Factors associated with treatment delay among patients with tuberculosis in Chiang Mai Province, Thailand, 2020&#x2010;2024. Estimates represent differences in the expected time to treatment initiation derived from the accelerated failure time model. Urban residence, the most accessible residence category, was used as the reference group for rural and remote residence estimates.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-6"><title>Simulation Results of Modeled Scenarios</title><p>We derived baseline values for scenario comparisons from Chiang Mai provincial TB program indicators. The scenario analysis did not model the redistribution of specific resources between geographic risk areas. Instead, it represented potential programmatic improvements in detection-related indicators, treatment coverage, and mortality under predefined assumptions. Under these modeled scenarios, the models projected detection-related indicators to increase by 25% (95% CI 22&#x2010;28), treatment coverage by 15% (95% CI 12&#x2010;18), and mortality to decrease by 20% (95% CI 16&#x2010;24) relative to baseline conditions (<xref ref-type="table" rid="table6">Table 6</xref>). Readers should interpret these projections as scenario-based estimates rather than as observed effects of resource reallocation or implemented program changes.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Projected outcomes under modeled scenarios relative to provincial baseline indicators<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup>.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Outcome</td><td align="left" valign="bottom">Provincial baseline (%)</td><td align="left" valign="bottom">Projected change (%)</td><td align="left" valign="bottom">95% CI (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Detection-related indicators</td><td align="left" valign="top">87.08</td><td align="left" valign="top">+25</td><td align="left" valign="top">22&#x2010;28</td></tr><tr><td align="left" valign="top">Treatment coverage</td><td align="left" valign="top">71.90</td><td align="left" valign="top">+15</td><td align="left" valign="top">12&#x2010;18</td></tr><tr><td align="left" valign="top">Mortality</td><td align="left" valign="top">11.90</td><td align="left" valign="top">&#x2013;20</td><td align="left" valign="top">16&#x2010;24</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>Projected outcomes under modeled scenarios are relative to provincial baseline indicators in Chiang Mai Province, Thailand. Estimates represent model-based projections under predefined assumptions and do not reflect observed intervention effects or implemented program changes. Baseline values were obtained from provincial tuberculosis program indicators.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study examined TB outcomes using routinely collected surveillance data and applied predictive modeling to identify factors associated with mortality and treatment delay. The findings suggest distinct patterns in TB outcomes, where mortality was more strongly associated with clinical vulnerability, while treatment delay was more closely related to health care access factors. By examining these outcomes within a unified surveillance-based analytical framework, this study highlights the importance of distinguishing between clinical risk factors and health care access barriers when designing TB control strategies, as these domains reflect distinct yet interacting pathways that influence patient outcomes.</p><p>The SEIR-informed framework provided a structure for organizing disease-stage concepts, and the predictive models focused on recorded clinical and programmatic outcomes in NTIP, including treatment success, mortality, and time to treatment initiation. This approach linked an epidemiological disease-stage perspective with practical risk stratification using routinely collected surveillance data.</p></sec><sec id="s4-2"><title>Comparison With Previous Studies</title><p>The association between HIV co-infection and higher mortality observed in this study (HR=5.80) is consistent with prior survival analyses showing reduced survival among patients with TB or HIV coinfection [<xref ref-type="bibr" rid="ref25">25</xref>] and cohort evidence identifying HIV positivity as a predictor of mortality among patients with TB [<xref ref-type="bibr" rid="ref26">26</xref>]. The relatively high magnitude of association observed in this study may, therefore, reflect not only HIV-related clinical vulnerability and the increased complexity of clinical management in patients with coinfection, but also contextual factors such as diagnostic timing and health system access, which previous studies have identified as contributors to diagnostic delays and poorer TB outcomes [<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>In addition to HIV co-infection, baseline metabolic and nutritional factors also appear relevant to TB outcomes. The associations observed for diabetes are consistent with data from prospective cohorts, indicating that diabetes and prediabetes are associated with adverse TB treatment outcomes [<xref ref-type="bibr" rid="ref28">28</xref>]. Moreover, prior research has linked dysglycemia to more severe disease presentation, including higher radiographic severity and increased bacillary load, as well as increased TB lethality among patients with diabetes [<xref ref-type="bibr" rid="ref29">29</xref>]. Low BMI may indicate nutritional vulnerability and should be interpreted in the context of a broader clinical risk profile rather than as an independent predictor, consistent with survival analyses demonstrating the significance of baseline clinical characteristics in shaping TB mortality risk [<xref ref-type="bibr" rid="ref26">26</xref>].</p><p>In addition to these clinical risk factors, health system and access-related barriers also contributed to differences in TB outcomes. Regarding treatment delay, the finding that rural and remote populations experienced longer delays is consistent with systematic review evidence indicating that delays in diagnosis and treatment of TB continue to be important barriers to TB control [<xref ref-type="bibr" rid="ref27">27</xref>]. One suggested approach to reduce these access gaps is active case-finding, particularly through community-based approaches [<xref ref-type="bibr" rid="ref30">30</xref>] and screening in general or at-risk populations [<xref ref-type="bibr" rid="ref31">31</xref>]. However, these approaches are likely to be most effective when implemented with appropriate coverage and linked to timely diagnosis and treatment initiation. These findings suggest that geographic variation in treatment delay may reflect underlying disparities in health care access and care pathways rather than solely spatial disease patterns.</p></sec><sec id="s4-3"><title>Interpretation and Implications</title><p>From a methodological perspective, the results are consistent with a broader pattern in the TB modeling literature, in which different modeling approaches capture different aspects of the disease process. Researchers have applied ML methods to address several TB-related predictive tasks, including diagnostic classification with high-dimensional serological data [<xref ref-type="bibr" rid="ref32">32</xref>], incidence prediction using meteorological and air pollution data [<xref ref-type="bibr" rid="ref6">6</xref>], and treatment outcome prediction using routinely available clinical indicators [<xref ref-type="bibr" rid="ref33">33</xref>]. Recent work has also examined the use of ML for TB incidence forecasting within broader epidemiological modeling frameworks [<xref ref-type="bibr" rid="ref34">34</xref>]. Such approaches are often designed to optimize predictive accuracy; however, they may have limited interpretability regarding underlying disease mechanisms, particularly when the observed data include only diagnosed and reported cases rather than the full spectrum of transmission dynamics.</p><p>Mechanistic models, particularly SEIR-based approaches, provide a structured framework for conceptualizing disease progression and population-level disease dynamics [<xref ref-type="bibr" rid="ref35">35</xref>] and have been extended to examine TB dynamics under different modeling assumptions [<xref ref-type="bibr" rid="ref36">36</xref>]. Nevertheless, such models often rely on simplifying assumptions and may not fully capture real-world heterogeneity or individual-level risk. In this study, we used the SEIR framework conceptually to organize disease stages, while applying predictive models to recorded outcomes in routine surveillance data. The analysis, therefore, focused on recorded clinical and programmatic outcomes rather than population-level transmission dynamics. This approach supports alignment between theoretical disease-stage concepts and the structure of routinely available surveillance data.</p><p>Recent advances in hybrid TB modeling suggest that integrating mechanistic models with ML may provide a more balanced framework that supports predictive performance while maintaining epidemiological interpretability [<xref ref-type="bibr" rid="ref37">37</xref>]. In this study, this integration was applied at a conceptual level, reflecting the structure and constraints of routine surveillance data. The study demonstrates a practical approach to organizing surveillance data within an epidemiologically informed framework to support the prediction of recorded TB outcomes and risk stratification.</p><p>The literature has well established that TB epidemiology exhibits spatial heterogeneity, with geographic variation observed across spatial and socioeconomic contexts [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. More recently, work using satellite imagery and urban density measures has shown that spatial proxies may help identify areas for targeted active case-finding, while highlighting the need for cautious interpretation of geographic risk patterns [<xref ref-type="bibr" rid="ref39">39</xref>]. The observed association between geographic residence and treatment delay suggests that spatial disparities in TB outcomes are attributable to differences in health care access and service availability. However, spatial clustering does not necessarily reflect transmission dynamics, and geographic variation may also be due to differences in health care access, reporting systems, population structure, and socioeconomic conditions. This distinction is important because outcomes may vary geographically due to both epidemiological and health-system factors.</p><p>From a programmatic perspective, the findings suggest that interventions targeting both early case detection and reduction of structural barriers to health care access may be needed to improve TB outcomes, rather than applying a uniform strategy across all populations. This distinction has implications for intervention design, as strategies to address clinical risk (eg, comorbidity management) may differ substantially from those intended to address access barriers (eg, service decentralization or active case-finding). This interpretation is consistent with the scenario analyses presented in this study, which show that improvements in detection and treatment processes could be associated with changes in projected outcomes under modeled assumptions. These projections provide scenario-based estimates of possible implications for programs, and readers should interpret them in the context of the assumptions and baseline indicators used in the analysis.</p><p>Targeted case-finding strategies may help improve access to diagnosis, especially in high-risk populations. However, delays in TB care are multifactorial and influenced by both patient- and health system&#x2013;level factors [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. The effectiveness of these approaches may, therefore, depend on both expanded access and integration into routine care pathways. In practical terms, predictive outputs may help TB programs prioritize active follow-up, outreach screening, referral support, patient navigation, and closer monitoring for clinically vulnerable patients or those living in underserved areas. Further implementation research is needed to determine whether these outputs should guide additional resources, the redistribution of existing resources, or both. Digital health technologies and clinical decision support systems may facilitate implementation [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref40">40</xref>], but future studies should evaluate their practical impact in real-world clinical and public health settings.</p></sec><sec id="s4-4"><title>Strengths</title><p>This study used a large dataset derived from a routine TB surveillance system, supporting the relevance of the findings to real-world programmatic settings. The analysis considered multiple outcomes, including treatment success, mortality, and time to treatment initiation, allowing for a broader assessment of the TB care pathway. In addition, the use of established statistical approaches supported risk stratification and the identification of high-risk subgroups using routinely available data. These strengths may enhance the applicability of the findings to TB control programs, although readers should interpret the results within the context of surveillance-based data.</p><p>A further strength of the study is the alignment between the analytical methods and the structure of the available surveillance data. By focusing on recorded outcomes, the framework supports practical interpretation for routine programmatic settings while retaining an epidemiologically informed structure for organizing disease-stage concepts.</p></sec><sec id="s4-5"><title>Limitations</title><p>This study has several important limitations. First, the use of routinely collected surveillance data may be subject to missing data, misclassification, and variability in data quality across reporting sites. Important variables, including socioeconomic status, income, education, migrant status, health care-seeking behavior, timing of symptom onset, and distance to health care facilities, may not have been consistently recorded. Their absence may have introduced residual confounding, particularly in the analysis of treatment delay, as unmeasured social and structural barriers may partly explain the observed associations between rural or remote residence and delayed treatment initiation. The study period also overlapped with the COVID-19 pandemic, which may have affected health care-seeking behavior, TB screening activities, diagnostic access, reporting completeness, and time to treatment initiation [<xref ref-type="bibr" rid="ref41">41</xref>].</p><p>Second, the study was based on registered TB cases in NTIP and may not capture undiagnosed cases, unreported cases, or individuals who did not access care. Readers should therefore interpret the findings as reflecting patterns among registered patients rather than the full burden and heterogeneity of TB in the underlying population. Because NTIP includes diagnosed and registered patients with TB, it cannot directly estimate the population-level effect of increased screening on undiagnosed or unreported cases. Readers should therefore interpret the assumed increase in screening or detection-related indicators in the scenario analysis as a programmatic assumption applied to provincial baseline indicators rather than as an effect estimated from the NTIP cohort itself.</p><p>Third, although we used the SEIR framework to guide the conceptual organization of disease stages, the available surveillance data did not directly observe susceptible or exposed populations, and we did not empirically estimate or validate SEIR transition parameters. Accordingly, readers should interpret the framework as SEIR-informed rather than as a fully parameterized transmission model. The observational design also limits causal inference; readers should interpret observed associations as predictive or outcome-specific rather than causal. In addition, combining an epidemiologically informed disease-stage framework with individual-level predictive models requires cautious interpretation; researchers should not directly infer population-level concepts from individual-level associations.</p><p>Finally, although we performed internal validation using train-test splitting and cross-validation, we did not conduct external validation using independent datasets. The models may perform differently in settings with varying epidemiological profiles, health care access patterns, population characteristics, reporting completeness, or data quality. The use of multiple predictors and outcome-specific models may also increase the risk of overfitting, particularly in subgroups or lower-frequency outcomes. We based the scenario analysis on predefined assumptions and provincial baseline indicators rather than observed intervention data; therefore, readers should interpret projected changes as illustrative programmatic projections. Future studies should compare performance with simpler baseline models, validate calibration and discrimination in independent datasets, examine sensitivity to scenario assumptions, and evaluate feasibility and implementation in routine TB control.</p></sec><sec id="s4-6"><title>Conclusions</title><p>TB outcomes in Chiang Mai Province reflected the combined influence of clinical vulnerability and health care access barriers. Mortality was more strongly associated with clinical factors, including HIV co-infection, older age, diabetes, and low BMI. In contrast, treatment delay was more closely related to rural or remote residence and lack of health insurance. These findings suggest that TB control strategies should combine intensified clinical monitoring for high-risk patients with improved access to timely diagnosis and treatment for underserved populations.</p><p>An SEIR-informed predictive framework using routine surveillance data may support risk stratification and program planning by identifying high-risk groups and access-related delays in the TB care pathway. The findings support practical actions such as active follow-up for patients with HIV co-infection or other clinical vulnerabilities, strengthened outreach and referral pathways in rural and remote areas, improved linkage to care for uninsured patients, and targeted prioritization of follow-up, outreach, and linkage-to-care activities.</p><p>Model-based scenario results suggest that improvements in detection-related indicators and treatment coverage could contribute to better TB outcomes under predefined assumptions. However, readers should interpret these projections cautiously because they are based on modeled scenarios rather than observed intervention effects. Before wider implementation, future studies should externally validate the predictive framework in independent datasets and evaluate it prospectively in routine TB control settings to assess feasibility, calibration, clinical usefulness, and impact on decision-making.</p></sec></sec></body><back><ack><p>The authors thank the staff of the Chiang Mai Provincial Tuberculosis Control Network and the public health personnel at all levels of the health system for their cooperation in data preparation and verification. The authors declare the use of generative AI during manuscript revision. ChatGPT by OpenAI was used under full human supervision to support text generation for revised wording, proofreading and editing, and reformatting. Generative AI was not used to generate original data, conduct statistical analyses, create or modify figures, select references independently, or make independent scientific interpretations. All AI-assisted content was reviewed, edited, verified, and approved by the authors. Responsibility for the accuracy, integrity, and final content of the manuscript lies entirely with the authors. Generative AI tools are not listed as authors and do not bear responsibility for the final outcomes.</p></ack><notes><sec><title>Funding</title><p>This research was supported by Chiang Mai University.</p></sec></notes><fn-group><fn fn-type="con"><p>PS conceptualized the study, performed the investigation, collected data, and drafted the original manuscript.</p><p>EB contributed to data analysis, curation, and editing.</p><p>AT conducted formal analysis and data curation, and contributed to writing and review. SM contributed to methodology development and critical review. SC was responsible for validation and manuscript review. WB supervised the overall study, provided resources, and served as the corresponding author. All authors read and approved the final version of this manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb2">HR</term><def><p>hazard ratio</p></def></def-item><def-item><term id="abb3">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb4">NTIP</term><def><p>National Tuberculosis Information Program</p></def></def-item><def-item><term id="abb5">SEIR</term><def><p>susceptible-exposed-infectious-recovered</p></def></def-item><def-item><term id="abb6">SEIR-D</term><def><p>susceptible-exposed-infectious-recovered-death</p></def></def-item><def-item><term id="abb7">TB</term><def><p>tuberculosis</p></def></def-item><def-item><term id="abb8">WHO</term><def><p>World Health Organization</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="report"><article-title>Global tuberculosis report 2025</article-title><year>2025</year><access-date>2026-06-11</access-date><publisher-name>World Health Organization</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://iris.who.int/server/api/core/bitstreams/e97dd6f4-b567-4396-8680-717bac6869a9/content">https://iris.who.int/server/api/core/bitstreams/e97dd6f4-b567-4396-8680-717bac6869a9/content</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>Tuberculosis profile: Thailand</article-title><source>World Health Organization</source><access-date>2026-04-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://worldhealthorg.shinyapps.io/tb_profiles/?_inputs_&#x0026;tab=%22charts%22&#x0026;lan=%22EN%22&#x0026;iso3=%22THA%22&#x0026;entity_type=%22country%22">https://worldhealthorg.shinyapps.io/tb_profiles/?_inputs_&#x0026;tab=%22charts%22&#x0026;lan=%22EN%22&#x0026;iso3=%22THA%22&#x0026;entity_type=%22country%22</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chinpong</surname><given-names>K</given-names> </name><name name-style="western"><surname>Thavornwattana</surname><given-names>K</given-names> </name><name name-style="western"><surname>Armatrmontree</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Spatiotemporal epidemiology of tuberculosis in Thailand from 2011 to 2020</article-title><source>Biology (Basel)</source><year>2022</year><month>05</month><day>16</day><volume>11</volume><issue>5</issue><fpage>755</fpage><pub-id pub-id-type="doi">10.3390/biology11050755</pub-id><pub-id pub-id-type="medline">35625483</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Side</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mulbar</surname><given-names>U</given-names> </name><name name-style="western"><surname>Sidjara</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sanusi</surname><given-names>W</given-names> </name></person-group><article-title>A SEIR model for transmission of tuberculosis</article-title><conf-name>The 4th International Conference on Mathematical Sciences &#x2013; Mathematical Sciences: Championing the Way in a Problem Based and Data Driven Society</conf-name><conf-date>Nov 15-17, 2016</conf-date><pub-id pub-id-type="doi">10.1063/1.4980867</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adi</surname><given-names>YA</given-names> </name></person-group><article-title>An investigation of Susceptible&#x2013;exposed&#x2013;infectious&#x2013;recovered (SEIR) tuberculosis model dynamics with pseudo-recovery and psychological effect</article-title><source>Healthcare Analytics</source><year>2024</year><month>12</month><volume>6</volume><fpage>100361</fpage><pub-id pub-id-type="doi">10.1016/j.health.2024.100361</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Yuan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Machine learning prediction model of tuberculosis incidence based on meteorological factors and air pollutants</article-title><source>Int J Environ Res Public Health</source><year>2023</year><month>02</month><day>22</day><volume>20</volume><issue>5</issue><fpage>3910</fpage><pub-id pub-id-type="doi">10.3390/ijerph20053910</pub-id><pub-id pub-id-type="medline">36900920</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bartl</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zeeb</surname><given-names>M</given-names> </name><name name-style="western"><surname>K&#x00E4;lin</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Machine learning-based prediction of active tuberculosis in people with HIV using clinical data</article-title><source>Clin Infect Dis</source><year>2025</year><month>10</month><day>6</day><volume>81</volume><issue>3</issue><fpage>521</fpage><lpage>530</lpage><pub-id pub-id-type="doi">10.1093/cid/ciaf149</pub-id><pub-id pub-id-type="medline">40132061</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Verboven</surname><given-names>L</given-names> </name><name name-style="western"><surname>Calders</surname><given-names>T</given-names> </name><name name-style="western"><surname>Callens</surname><given-names>S</given-names> </name><etal/></person-group><article-title>A treatment recommender clinical decision support system for personalized medicine: method development and proof-of-concept for drug resistant tuberculosis</article-title><source>BMC Med Inform Decis Mak</source><year>2022</year><month>03</month><day>2</day><volume>22</volume><issue>1</issue><fpage>56</fpage><pub-id pub-id-type="doi">10.1186/s12911-022-01790-0</pub-id><pub-id pub-id-type="medline">35236355</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>C</given-names> </name></person-group><article-title>Clinical assistant decision-making model of tuberculosis based on electronic health records</article-title><source>BioData Min</source><year>2023</year><month>03</month><day>16</day><volume>16</volume><issue>1</issue><fpage>11</fpage><pub-id pub-id-type="doi">10.1186/s13040-023-00328-y</pub-id><pub-id pub-id-type="medline">36927471</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hethcote</surname><given-names>HW</given-names> </name></person-group><article-title>The mathematics of infectious diseases</article-title><source>SIAM Rev</source><year>2000</year><month>01</month><day>1</day><volume>42</volume><issue>4</issue><fpage>599</fpage><lpage>653</lpage><pub-id pub-id-type="doi">10.1137/S0036144500371907</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jittimanee</surname><given-names>S</given-names> </name><name name-style="western"><surname>Vorasingha</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mad-asin</surname><given-names>W</given-names> </name><name name-style="western"><surname>Nateniyom</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rienthong</surname><given-names>S</given-names> </name><name name-style="western"><surname>Varma</surname><given-names>JK</given-names> </name></person-group><article-title>Tuberculosis in Thailand: epidemiology and program performance, 2001-2005</article-title><source>Int J Infect Dis</source><year>2009</year><month>07</month><volume>13</volume><issue>4</issue><fpage>436</fpage><lpage>442</lpage><pub-id pub-id-type="doi">10.1016/j.ijid.2008.07.025</pub-id><pub-id pub-id-type="medline">19013094</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="report"><person-group person-group-type="author"><collab>Division of Tuberculosis, Department of Disease Control</collab></person-group><article-title>The report on the implementation of the National Tuberculosis Control Program 2016&#x2013;2020</article-title><year>2022</year><publisher-name>Ministry of Public Health</publisher-name></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="report"><person-group person-group-type="author"><collab>Division of Tuberculosis, Department of Disease Control</collab></person-group><article-title>Report of the 6th Tuberculosis Joint International Monitoring Mission Thailand: 29 May to 6 June 2022</article-title><year>2022</year><publisher-name>Ministry of Public Health</publisher-name></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><source>Multiple Imputation for Nonresponse in Surveys</source><year>1987</year><publisher-name>John Wiley &#x0026; Sons</publisher-name><pub-id pub-id-type="doi">10.1002/9780470316696</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>van Buuren</surname><given-names>S</given-names> </name></person-group><source>Flexible Imputation of Missing Data</source><year>2018</year><edition>2</edition><publisher-name>Chapman and Hall/CRC</publisher-name><pub-id pub-id-type="doi">10.1201/9780429492259</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Azur</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Stuart</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Frangakis</surname><given-names>C</given-names> </name><name name-style="western"><surname>Leaf</surname><given-names>PJ</given-names> </name></person-group><article-title>Multiple imputation by chained equations: what is it and how does it work?</article-title><source>Int J Methods Psych Res</source><year>2011</year><month>03</month><volume>20</volume><issue>1</issue><fpage>40</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1002/mpr.329</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hosmer</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Lemeshow</surname><given-names>S</given-names> </name></person-group><source>Applied Logistic Regression</source><year>2000</year><publisher-name>John Wiley &#x0026; Sons</publisher-name><pub-id pub-id-type="doi">10.1002/0471722146</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name></person-group><source>Clinical Prediction Models: A Practical Approach to Development, Validation, and Updating</source><year>2009</year><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-0-387-77244-8</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cox</surname><given-names>DR</given-names> </name></person-group><article-title>Regression models and life-tables</article-title><source>J R Stat Soc Series B Stat Methodol</source><year>1972</year><month>01</month><day>1</day><volume>34</volume><issue>2</issue><fpage>187</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1111/j.2517-6161.1972.tb00899.x</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Kleinbaum</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>M</given-names> </name></person-group><source>Survival Analysis: A Self-Learning Text</source><year>2012</year><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-1-4419-6646-9</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Keeling</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Rohani</surname><given-names>P</given-names> </name></person-group><source>Modeling Infectious Diseases in Humans and Animals</source><year>2008</year><publisher-name>Princeton University Press</publisher-name><pub-id pub-id-type="doi">10.2307/j.ctvcm4gk0</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hanley</surname><given-names>JA</given-names> </name><name name-style="western"><surname>McNeil</surname><given-names>BJ</given-names> </name></person-group><article-title>The meaning and use of the area under a receiver operating characteristic (ROC) curve</article-title><source>Radiology</source><year>1982</year><month>04</month><volume>143</volume><issue>1</issue><fpage>29</fpage><lpage>36</lpage><pub-id pub-id-type="doi">10.1148/radiology.143.1.7063747</pub-id><pub-id pub-id-type="medline">7063747</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harrell</surname><given-names>FE</given-names>  <suffix>Jr</suffix></name><name name-style="western"><surname>Califf</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Pryor</surname><given-names>DB</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Rosati</surname><given-names>RA</given-names> </name></person-group><article-title>Evaluating the yield of medical tests</article-title><source>JAMA</source><year>1982</year><month>05</month><day>14</day><volume>247</volume><issue>18</issue><fpage>2543</fpage><lpage>2546</lpage><pub-id pub-id-type="doi">10.1001/jama.1982.03320430047030</pub-id><pub-id pub-id-type="medline">7069920</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dowdy</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Dye</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>T</given-names> </name></person-group><article-title>Data needs for evidence-based decisions: a tuberculosis modeler&#x2019;s &#x201C;wish list&#x201D;</article-title><source>Int J Tuberc Lung Dis</source><year>2013</year><month>07</month><volume>17</volume><issue>7</issue><fpage>866</fpage><lpage>877</lpage><pub-id pub-id-type="doi">10.5588/ijtld.12.0573</pub-id><pub-id pub-id-type="medline">23743307</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lelisho</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Wotale</surname><given-names>TW</given-names> </name><name name-style="western"><surname>Tareke</surname><given-names>SA</given-names> </name><etal/></person-group><article-title>Survival rate and predictors of mortality among TB/HIV co-infected adult patients: retrospective cohort study</article-title><source>Sci Rep</source><year>2022</year><month>11</month><day>1</day><volume>12</volume><issue>1</issue><fpage>18360</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-23316-4</pub-id><pub-id pub-id-type="medline">36319734</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xie</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Han</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name></person-group><article-title>Survival analysis of risk factors for mortality in a cohort of patients with tuberculosis</article-title><source>Can Respir J</source><year>2020</year><volume>2020</volume><fpage>1654653</fpage><pub-id pub-id-type="doi">10.1155/2020/1654653</pub-id><pub-id pub-id-type="medline">32963642</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bello</surname><given-names>S</given-names> </name><name name-style="western"><surname>Afolabi</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Ajayi</surname><given-names>DT</given-names> </name><etal/></person-group><article-title>Empirical evidence of delays in diagnosis and treatment of pulmonary tuberculosis: systematic review and meta-regression analysis</article-title><source>BMC Public Health</source><year>2019</year><month>06</month><day>25</day><volume>19</volume><issue>1</issue><fpage>820</fpage><pub-id pub-id-type="doi">10.1186/s12889-019-7026-4</pub-id><pub-id pub-id-type="medline">31238906</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arriaga</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Ara&#x00FA;jo-Pereira</surname><given-names>M</given-names> </name><name name-style="western"><surname>Barreto-Duarte</surname><given-names>B</given-names> </name><etal/></person-group><article-title>The effect of diabetes and prediabetes on antituberculosis treatment outcomes: a multicenter prospective cohort study</article-title><source>J Infect Dis</source><year>2022</year><month>02</month><day>15</day><volume>225</volume><issue>4</issue><fpage>617</fpage><lpage>626</lpage><pub-id pub-id-type="doi">10.1093/infdis/jiab427</pub-id><pub-id pub-id-type="medline">34651642</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bezerra</surname><given-names>AL</given-names> </name><name name-style="western"><surname>da Silva Rezende Moreira</surname><given-names>A</given-names></name><name name-style="western"><surname>Isidoro-Gon&#x00E7;alves</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Clinical, laboratory, and radiographic aspects of patients with pulmonary tuberculosis and dysglycemia and tuberculosis treatment outcomes</article-title><source>J Bras Pneumol</source><year>2022</year><volume>48</volume><issue>6</issue><fpage>e20210505</fpage><pub-id pub-id-type="doi">10.36416/1806-3756/e20210505</pub-id><pub-id pub-id-type="medline">36449815</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burke</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Nliwasa</surname><given-names>M</given-names> </name><name name-style="western"><surname>Feasey</surname><given-names>HRA</given-names> </name><etal/></person-group><article-title>Community-based active case-finding interventions for tuberculosis: a systematic review</article-title><source>Lancet Public Health</source><year>2021</year><month>05</month><volume>6</volume><issue>5</issue><fpage>e283</fpage><lpage>e299</lpage><pub-id pub-id-type="doi">10.1016/S2468-2667(21)00033-5</pub-id><pub-id pub-id-type="medline">33765456</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bohlbro</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Hvingelby</surname><given-names>VS</given-names> </name><name name-style="western"><surname>Rudolf</surname><given-names>F</given-names> </name><name name-style="western"><surname>Wejse</surname><given-names>C</given-names> </name><name name-style="western"><surname>Patsche</surname><given-names>CB</given-names> </name></person-group><article-title>Active case-finding of tuberculosis in general populations and at-risk groups: a systematic review and meta-analysis</article-title><source>Eur Respir J</source><year>2021</year><month>10</month><volume>58</volume><issue>4</issue><fpage>2100090</fpage><pub-id pub-id-type="doi">10.1183/13993003.00090-2021</pub-id><pub-id pub-id-type="medline">33766950</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rashidi</surname><given-names>HH</given-names> </name><name name-style="western"><surname>Dang</surname><given-names>LT</given-names> </name><name name-style="western"><surname>Albahra</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ravindran</surname><given-names>R</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>IH</given-names> </name></person-group><article-title>Automated machine learning for endemic active tuberculosis prediction from multiplex serological data</article-title><source>Sci Rep</source><year>2021</year><month>09</month><day>9</day><volume>11</volume><issue>1</issue><fpage>17900</fpage><pub-id pub-id-type="doi">10.1038/s41598-021-97453-7</pub-id><pub-id pub-id-type="medline">34504228</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Prediction of tuberculosis treatment outcomes using biochemical makers with machine learning</article-title><source>BMC Infect Dis</source><year>2025</year><month>02</month><day>17</day><volume>25</volume><issue>1</issue><fpage>229</fpage><pub-id pub-id-type="doi">10.1186/s12879-025-10609-y</pub-id><pub-id pub-id-type="medline">39962412</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>K B</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Jose</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Jirawattanapanit</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mathew</surname><given-names>K</given-names> </name></person-group><article-title>A comprehensive study on tuberculosis prediction models: integrating machine learning into epidemiological analysis</article-title><source>J Theor Biol</source><year>2025</year><month>01</month><day>21</day><volume>597</volume><fpage>111988</fpage><pub-id pub-id-type="doi">10.1016/j.jtbi.2024.111988</pub-id><pub-id pub-id-type="medline">39542168</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Biswas</surname><given-names>MHA</given-names> </name><name name-style="western"><surname>Paiva</surname><given-names>LT</given-names> </name><name name-style="western"><surname>de Pinho</surname><given-names>MDR</given-names> </name></person-group><article-title>A SEIR model for control of infectious diseases with constraints</article-title><source>Math Biosci Eng</source><year>2014</year><volume>11</volume><fpage>761</fpage><lpage>784</lpage><pub-id pub-id-type="doi">10.3934/mbe.2014.11.761</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ucakan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Gulen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Koklu</surname><given-names>K</given-names> </name></person-group><article-title>Analysing of tuberculosis in Turkey through SIR, SEIR and BSEIR mathematical models</article-title><source>Math Comput Model Dyn Syst</source><year>2021</year><month>01</month><day>2</day><volume>27</volume><issue>1</issue><fpage>179</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1080/13873954.2021.1881560</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghosh</surname><given-names>A</given-names> </name><name name-style="western"><surname>Das</surname><given-names>P</given-names> </name><name name-style="western"><surname>Das</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Das</surname><given-names>P</given-names> </name><name name-style="western"><surname>Upadhyay</surname><given-names>RK</given-names> </name></person-group><article-title>Forecasting tuberculosis through mechanistic learning of transmission dynamics: insights from a case study in India</article-title><source>Comput Biol Med</source><year>2025</year><month>11</month><volume>198</volume><issue>Pt B</issue><fpage>111225</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2025.111225</pub-id><pub-id pub-id-type="medline">41130159</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaweno</surname><given-names>D</given-names> </name><name name-style="western"><surname>Karmakar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Alene</surname><given-names>KA</given-names> </name><etal/></person-group><article-title>Methods used in the spatial analysis of tuberculosis epidemiology: a systematic review</article-title><source>BMC Med</source><year>2018</year><month>10</month><day>18</day><volume>16</volume><issue>1</issue><fpage>193</fpage><pub-id pub-id-type="doi">10.1186/s12916-018-1178-4</pub-id><pub-id pub-id-type="medline">30333043</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Faccin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Geenen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Happaerts</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ombelet</surname><given-names>S</given-names> </name><name name-style="western"><surname>Migambi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Andr&#x00E9;</surname><given-names>E</given-names> </name></person-group><article-title>Analyzing satellite imagery to target tuberculosis control interventions in densely urbanized areas of Kigali, Rwanda: cross-sectional pilot study</article-title><source>JMIR Public Health Surveill</source><year>2025</year><month>04</month><day>24</day><volume>11</volume><fpage>e68355</fpage><pub-id pub-id-type="doi">10.2196/68355</pub-id><pub-id pub-id-type="medline">40273403</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Raviglione</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Flahault</surname><given-names>A</given-names> </name></person-group><article-title>Use of digital technology to enhance tuberculosis control: scoping review</article-title><source>J Med Internet Res</source><year>2020</year><month>02</month><day>13</day><volume>22</volume><issue>2</issue><fpage>e15727</fpage><pub-id pub-id-type="doi">10.2196/15727</pub-id><pub-id pub-id-type="medline">32053111</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McQuaid</surname><given-names>CF</given-names> </name><name name-style="western"><surname>Vassall</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Fiekert</surname><given-names>K</given-names> </name><name name-style="western"><surname>White</surname><given-names>RG</given-names> </name></person-group><article-title>The impact of COVID-19 on TB: a review of the data</article-title><source>Int J Tuberc Lung Dis</source><year>2021</year><month>06</month><day>1</day><volume>25</volume><issue>6</issue><fpage>436</fpage><lpage>446</lpage><pub-id pub-id-type="doi">10.5588/ijtld.21.0148</pub-id><pub-id pub-id-type="medline">34049605</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Checklist 1</label><p>STROBE checklist.</p><media xlink:href="publichealth_v12i1e86495_app1.pdf" xlink:title="PDF File, 118 KB"/></supplementary-material></app-group></back></article>