<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id><journal-id journal-id-type="publisher-id">publichealth</journal-id><journal-id journal-id-type="index">9</journal-id><journal-title>JMIR Public Health and Surveillance</journal-title><abbrev-journal-title>JMIR Public Health Surveill</abbrev-journal-title><issn pub-type="epub">2369-2960</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e67840</article-id><article-id pub-id-type="doi">10.2196/67840</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Identifying Data-Driven Clinical Subgroups for Cervical Cancer Prevention With Machine Learning: Population-Based, External, and Diagnostic Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Lu</surname><given-names>Zhen</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dong</surname><given-names>Binhua</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cai</surname><given-names>Hongning</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tian</surname><given-names>Tian</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Junfeng</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fu</surname><given-names>Leiwen</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Bingyi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff8">8</xref><xref ref-type="aff" rid="aff9">9</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Weijie</given-names></name><degrees>BD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lin</surname><given-names>Shaomei</given-names></name><degrees>BD</degrees><xref ref-type="aff" rid="aff10">10</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tuo</surname><given-names>Xunyuan</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff11">11</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Juntao</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff12">12</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yang</surname><given-names>Tianjie</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff13">13</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Huang</surname><given-names>Xinxin</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff14">14</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zheng</surname><given-names>Zheng</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff13">13</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xue</surname><given-names>Huifeng</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff15">15</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xu</surname><given-names>Shuxia</given-names></name><degrees>BD</degrees><xref ref-type="aff" rid="aff16">16</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Siyang</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sun</surname><given-names>Pengming</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff17">17</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Zou</surname><given-names>Huachun</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff18">18</xref><xref ref-type="aff" rid="aff19">19</xref><xref ref-type="aff" rid="aff20">20</xref></contrib></contrib-group><aff id="aff1"><institution>School of Public Health (Shenzhen), Sun Yat-sen University</institution><addr-line>Shenzhen</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of Gynecology, Laboratory of Gynecologic Oncology, Fujian Maternity and Child Health Hospital, College of Clinical Medicine for Obstetrics &#x0026; Gynecology and Pediatrics, Fujian Medical University</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><aff id="aff3"><institution>Fujian Key Laboratory of Women and Children&#x2019;s Critical Diseases Research</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><aff id="aff4"><institution>Department of Gynecology, Maternal and Child Health Hospital of Hubei Province (Women and Children's Hospital of Hubei Province) Wuhan</institution><addr-line>Wuhan</addr-line><country>China</country></aff><aff id="aff5"><institution>School of Public Health, Xinjiang Medical University</institution><addr-line>Urumqi</addr-line><country>China</country></aff><aff id="aff6"><institution>Division of Pharmacoepidemiology and Clinical Pharmacology, Utrecht Institute for Pharmaceutical Sciences, Utrecht University</institution><addr-line>Utrecht</addr-line><country>Netherlands</country></aff><aff id="aff7"><institution>Beijing Chest Hospital, Capital Medical University, Beijing Tuberculosis and Thoracic Tumor Research Institute</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff8"><institution>Institute for HIV/AIDS Control and Prevention, Guangdong Provincial Center for Disease Control and Prevention</institution><addr-line>Guangzhou</addr-line><country>China</country></aff><aff id="aff9"><institution>Department of HIV/AIDS Control and Prevention, Guangdong Provincial Academy of Preventive Medicine</institution><addr-line>Guangzhou</addr-line><country>China</country></aff><aff id="aff10"><institution>Department of Gynecology, Shunde Women's and Children's Hospital of Guangdong Medical University</institution><addr-line>Foshan</addr-line><country>China</country></aff><aff id="aff11"><institution>Department of Gynecology, Gansu Provincial Maternity and Child-care Hospital</institution><addr-line>Lanzhou</addr-line><country>China</country></aff><aff id="aff12"><institution>Department of Gynecology, Guiyang Maternal and Child Health Care Hospital</institution><addr-line>Guiyang</addr-line><country>China</country></aff><aff id="aff13"><institution>Department of Gynecology, Shenzhen Maternity &#x0026; Child Healthcare Hospital</institution><addr-line>Shenzhen</addr-line><country>China</country></aff><aff id="aff14"><institution>The Ministry of Health, Fujian Maternity and Child Health Hospital, College of Clinical Medicine for Obstetrics &#x0026; Gynecology and Pediatrics, Fujian Medical University</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><aff id="aff15"><institution>Center for Cervical Disease Diagnosis and Treatment, Fujian Maternity and Child Health Hospital, College of Clinical Medicine for Obstetrics &#x0026; Gynecology and Pediatrics, Fujian Medical University</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><aff id="aff16"><institution>Department of Pathology, Fujian Maternity and Child Health Hospital, College of Clinical Medicine for Obstetrics &#x0026; Gynecology and Pediatrics, Fujian Medical University</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><aff id="aff17"><institution>School of Group Medicine and Public Health, Peking Union Medical College</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff18"><institution>School of Public Health, Fudan University</institution><addr-line>Shanghai</addr-line><country>China</country></aff><aff id="aff19"><institution>Shenzhen Campus, Sun Yat-sen University</institution><addr-line>Shenzhen</addr-line><country>China</country></aff><aff id="aff20"><institution>Fujian Maternity and Child Health Hospital, College of Clinical Medicine for Obstetrics and Gynecology and Pediatrics, Fujian Medical University</institution><addr-line>Fuzhou</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Guerrero-Contreras</surname><given-names>Gabriel</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Liu</surname><given-names>Zhi-Ping</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Huachun Zou, PhD, School of Public Health, Fudan University, Room 435, Bld #8, 130 Dongan Road, Xuhui District, Shanghai, 200032, China, 86 21 5423 7707; <email>zouhuachun@fudan.edu.cn</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>19</day><month>3</month><year>2025</year></pub-date><volume>11</volume><elocation-id>e67840</elocation-id><history><date date-type="received"><day>22</day><month>10</month><year>2024</year></date><date date-type="rev-recd"><day>29</day><month>01</month><year>2025</year></date><date date-type="accepted"><day>29</day><month>01</month><year>2025</year></date></history><copyright-statement>&#x00A9; Zhen Lu, Binhua Dong, Hongning Cai, Tian Tian, Junfeng Wang, Leiwen Fu, Bingyi Wang, Weijie Zhang, Shaomei Lin, Xunyuan Tuo, Juntao Wang, Tianjie Yang, Xinxin Huang, Zheng Zheng, Huifeng Xue, Shuxia Xu, Siyang Liu, Pengming Sun, Huachun Zou. Originally published in JMIR Public Health and Surveillance (<ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>), 19.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://publichealth.jmir.org">https://publichealth.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://publichealth.jmir.org/2025/1/e67840"/><abstract><sec><title>Background</title><p>Cervical cancer remains a major global health issue. Personalized, data-driven cervical cancer prevention (CCP) strategies tailored to phenotypic profiles may improve prevention and reduce disease burden.</p></sec><sec><title>Objective</title><p>This study aimed to identify subgroups with differential cervical precancer or cancer risks using machine learning, validate subgroup predictions across datasets, and propose a computational phenomapping strategy to enhance global CCP efforts.</p></sec><sec sec-type="methods"><title>Methods</title><p>We explored the data-driven CCP subgroups by applying unsupervised machine learning to a deeply phenotyped, population-based discovery cohort. We extracted CCP-specific risks of cervical intraepithelial neoplasia (CIN) and cervical cancer through weighted logistic regression analyses providing odds ratio (OR) estimates and 95% CIs. We trained a supervised machine learning model and developed pathways to classify individuals before evaluating its diagnostic validity and usability on an external cohort.</p></sec><sec sec-type="results"><title>Results</title><p>This study included 551,934 women (median age, 49 years) in the discovery cohort and 47,130 women (median age, 37 years) in the external cohort. Phenotyping identified 5 CCP subgroups, with CCP4 showing the highest carcinoma prevalence. CCP2&#x2013;4 had significantly higher risks of CIN2+ (CCP2: OR 2.07 [95% CI: 2.03&#x2010;2.12], CCP3: 3.88 [3.78&#x2010;3.97], and CCP4: 4.47 [4.33&#x2010;4.63]) and CIN3+ (CCP2: 2.10 [2.05&#x2010;2.14], CCP3: 3.92 [3.82&#x2010;4.02], and CCP4: 4.45 [4.31&#x2010;4.61]) compared to CCP1 (<italic>P</italic>&#x003C;.001), consistent with the direction of results observed in the external cohort. The proposed triple strategy was validated as clinically relevant, prioritizing high-risk subgroups (CCP3-4) for colposcopies and scaling human papillomavirus screening for CCP1-2.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study underscores the potential of leveraging machine learning algorithms and large-scale routine electronic health records to enhance CCP strategies. By identifying key determinants of CIN2+/CIN3+ risk and classifying 5 distinct subgroups, our study provides a robust, data-driven foundation for the proposed triple strategy. This approach prioritizes tailored prevention efforts for subgroups with varying risks, offering a novel and scalable tool to complement existing cervical cancer screening guidelines. Future work should focus on independent external and prospective validation to maximize the global impact of this strategy.</p></sec></abstract><kwd-group><kwd>cervical cancer</kwd><kwd>human papillomavirus</kwd><kwd>screening</kwd><kwd>machine learning</kwd><kwd>cervical tumor</kwd><kwd>cancer</kwd><kwd>carcinoma</kwd><kwd>tumor</kwd><kwd>malignant</kwd><kwd>ML</kwd><kwd>phenomapping strategy</kwd><kwd>logistic regression</kwd><kwd>regression</kwd><kwd>population-based</kwd><kwd>validation study</kwd><kwd>cancer prevention</kwd><kwd>validity</kwd><kwd>usability</kwd><kwd>algorithm</kwd><kwd>surveillance</kwd><kwd>electronic health record</kwd><kwd>EHR</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Cervical cancer is the fourth most common cancer among women, with an estimated 660,000 new cases and 350,000 deaths globally in 2022 [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. It is the most common cancer in 25 countries and the leading cause of cancer death in 37 countries. Despite being largely preventable through human papillomavirus (HPV) vaccination [<xref ref-type="bibr" rid="ref3">3</xref>], the high incidence and persistence of high-risk HPV (hrHPV) remain the primary risk factors for cervical cancer [<xref ref-type="bibr" rid="ref4">4</xref>] and related diseases [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. In November 2020, the World Health Organization (WHO) launched a global initiative [<xref ref-type="bibr" rid="ref8">8</xref>] to eliminate cervical cancer as a public health problem, emphasizing a triple intervention strategy: vaccinating at least 90% of girls against HPV by age 15 years, screening 70% of women with a high-performance test by ages 35 and 45 years, and treating at least 90% of detected precancerous lesions and invasive cancers. Yet, globally, an estimated 1.6 billion (67%) of 2.3 billion women aged 20&#x2010;70 years have never been screened for cervical cancer [<xref ref-type="bibr" rid="ref9">9</xref>], and in China, 5-year screening coverage among women aged 35&#x2010;49 years was only 33%. Establishing high-quality, sustainable, and acceptable cervical cancer prevention (CCP) with broad coverage in resource-limited regions remains a critical challenge [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. While HPV-based screening has demonstrated significant benefits [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref18">18</xref>], leading the WHO to recommend it as the primary method for CCP globally [<xref ref-type="bibr" rid="ref19">19</xref>], its adoption in low- and middle-income countries (LMICs) is limited due to health inequities, resource constraints, and limited access to affordable, clinically validated HPV tests [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Addressing these barriers requires personalized CCP strategies.</p><p>We hypothesize that data-driven CCP subgroups, identified using machine learning, can provide valuable insights into CCP, enabling personalized strategies to reduce the risk of cervical intraepithelial neoplasia (CIN) and cervical cancer. Personalized CCP strategies depend on the unique phenotypic profile of each individual. The population, with its varying phenotypic diversity, comprises heterogeneous subgroups that reflect multiple underlying behavior patterns and causes of disease. Clinical practice guidelines also recommend that cervical cancer screening should be tailored to an individual&#x2019;s risk profile of HPV infection [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Therefore, the discovery of CCP subgroups could inform and improve the development of new screening strategies, public health policies, and clinical decision-making, as well as contribute to trial design, despite the complex causal relationships among individual risk factors [<xref ref-type="bibr" rid="ref4">4</xref>]. To date, no study has identified CCP subgroups. The incomplete understanding of these subgroups across large, diverse populations, coupled with insufficient validation through various methods, has hindered the implementation of the triple intervention strategy. Machine learning-based approaches allow for the phenotyping of entire populations based on individual characteristics, enabling the prediction of phenotypic clusters and disease onset [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Additionally, by defining a computational phenomap&#x2014;a mathematical construct of individual phenotypes based on baseline measures [<xref ref-type="bibr" rid="ref24">24</xref>]&#x2014;computational methods can assess the heterogeneous risk effects of distinct subpopulations. This approach accounts for the phenotypic diversity within populations and their subsequent histopathological diagnoses.</p><p>As such, in this study, we aimed to: (1) test the hypothesis that distinct CCP subgroups exhibit differential risks of cervical precancer or cancer based on their complex phenotypic profiles (development); (2) demonstrate internal validity (within a dataset and across methods), as well as external and diagnostic validity (across datasets; validation); and (3) propose a computational phenomapping strategy with clinical relevance and pathways to improve global access to CCP (impact).</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Source</title><p>Deidentified data were extracted from electronic health records (EHRs) of the national cervical cancer screening program in China. In summary, our study included eligible women aged 25&#x2010;65 years who participated in the cervical cancer screening. Data from Fujian Province (2014&#x2010;2023) were used to establish a discovery cohort to train the models. Additionally, EHR data from 5 other regions&#x2014;Shenzhen City, Foshan City, Hubei Province, Gansu Province, and Guizhou Province&#x2014;were employed as an external cohort to validate the generalizability of the models across diverse populations. Details on the study design, as illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>, are available in Appendix S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Study design. (<bold>A</bold>) We explored the data-driven cervical cancer prevention (CCP) subgroups by applying unsupervised machine learning to a deeply phenotyped, population-based discovery cohort. In this population-based, external, and diagnostic validation study, we aimed to use different machine learning methods to test our hypothesis (<bold>B</bold>) that individuals within distinct CCP subgroups exhibit differential risks of cervical precancer or cancer based on their complex phenotypic profiles. After identifying CCP subgroups, we extracted CCP-specific risks of outcomes of interest (<bold>C</bold>) conditionally on all predefined and algorithmically selected features through weighted logistic regression analyses providing average odds ratio (OR) estimates. Additionally, we stratified individuals based on their key features to conduct subgroup analyses. Finally, we trained a supervised machine learning model and developed pathways (<bold>D</bold>) to classify individuals using features most consistently linked to CCP subgroups before evaluating its diagnostic validity and usability on an external cohort. Pathologically abnormal diagnoses consisted of CIN1, CIN2, CIN3, and carcinoma. UMAP: uniform manifold approximation and projection; CCP: cervical cancer prevention; LCA: latent class analysis; NILM: negative for intraepithelial lesion or malignancy; CIN1: cervical intraepithelial neoplasia grade 1; CIN2: cervical intraepithelial neoplasia grade 2; CIN3: cervical intraepithelial neoplasia grade 3; CIN2+: cervical intraepithelial neoplasia grade 2 or worse; CIN3+: cervical intraepithelial neoplasia grade 3 or worse; OR: odds ratio; XGBoost: eXtreme gradient boosting; SCREENing: clinical Subgroups for CeRvical cancEr prEvention using computational phenomaps and machine learning; hrHPV: high-risk human papillomavirus; HPV: human papillomavirus.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e67840_fig01.png"/></fig></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study was approved by the Ethics Committee of Fujian Maternal and Child Health Hospital (2023KY141). No additional informed consent was required for this analysis. All participant data were deidentified prior to analysis. No images of identifiable individuals are included in the manuscript or supplementary materials.</p></sec><sec id="s2-3"><title>Data Preprocessing</title><p>In line with the consensus that detecting and treating CIN2 or CIN3 [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], key premalignant cervical conditions, can prevent progression to invasive cervical cancer, our primary and secondary outcomes were CIN2+ and CIN3+, respectively. These outcomes were confirmed by histopathology and align with those commonly used in previous studies [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. We selected features based on prior research [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref34">34</xref>] and input from clinical, biostatistical, and epidemiological experts. These included demographic characteristics, cervical cancer screening history, HPV infection status, and medical examination results. Details on data preprocessing are provided in Appendix S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-4"><title>Unsupervised Machine Learning</title><p>We calculated phenotypic distances between individuals using Gower&#x2019;s distance [<xref ref-type="bibr" rid="ref35">35</xref>], a dissimilarity metric suitable for mixed continuous and categorical data. To visualize phenotypic variation in the population, we employed uniform manifold approximation and projection (UMAP) [<xref ref-type="bibr" rid="ref36">36</xref>] to construct a phenomap. This approach enhances interpretability by presenting the distributions of individuals within a multidimensional phenotypic space, capturing the full range of baseline phenotypes. To identify and categorize the underlying CCP subgroups in which individuals exhibit phenotypic similarity, we employed and compared 3 methods to capture and validate CCP diversity: k-means [<xref ref-type="bibr" rid="ref37">37</xref>], latent class analysis [<xref ref-type="bibr" rid="ref38">38</xref>], and UMAP [<xref ref-type="bibr" rid="ref39">39</xref>]. The final number of CCP subgroups was determined by reaching a consensus across all 3 approaches. Further details are provided in Appendix S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-5"><title>Risk Estimates and an Algorithm to Identify Subgroups</title><p>To further explore the association between CCP subgroups and outcomes of interest, we calculated CCP-specific risk estimates (odds ratios, ORs) [<xref ref-type="bibr" rid="ref40">40</xref>] and 95% CIs using inverse probability weights [<xref ref-type="bibr" rid="ref41">41</xref>]. Additionally, we trained an eXtreme gradient boosting (XGBoost) algorithm [<xref ref-type="bibr" rid="ref42">42</xref>] to predict 5 CCP subgroups with differential risks of outcomes, as described in our previous work [<xref ref-type="bibr" rid="ref23">23</xref>]. Briefly, the model was trained and calibrated using an isotonic regression algorithm, and internally validated in the discovery cohort. The SHapley Additive exPlanations (SHAP) method was employed to identify each feature&#x2019;s relative contribution [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref43">43</xref>] and enhance the model&#x2019;s explainability. Model performance was evaluated using OVR AUROC (one-versus-rest area under the receiver operating characteristics curve, extended for multiple classes), Brier score, and calibration curves as primary metrics. In external validation, the model&#x2019;s diagnostic validity was assessed by comparing CCP-specific ORs between datasets to evaluate cross-cluster and cross-dataset risk differences. Further details are provided in Appendix S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-6"><title>Developing Pathways to Improve Impact</title><p>We named our computational phenomapping strategy SCREENing (clinical Subgroups for CeRvical cancEr prEvention using computational pheNomaps and machine learnING). To assess real-world usability and effectiveness, we consulted 11 clinical experts and 3 epidemiologists on its clinical relevance, justification, result interpretability, and potential impact on screening strategies and public health policymaking.</p></sec><sec id="s2-7"><title>Statistical Analysis</title><p>Given the importance of menopause in women, we specifically examined CCP-specific risks across age using spline analyses, with interaction tests to assess whether age modified these risks. Subgroup analyses were also performed by stratifying women based on key features. Details are provided in Appendix S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We followed the Guidelines for Developing and Reporting Machine Learning Predictive Models in Biomedical Research [<xref ref-type="bibr" rid="ref44">44</xref>] and the Transparent Reporting of a multivariable prediction model for Individual Prognosis or Diagnosis statement [<xref ref-type="bibr" rid="ref45">45</xref>]. Data management was performed using the lulab.utils R package [<xref ref-type="bibr" rid="ref46">46</xref>]. All analyses [<xref ref-type="bibr" rid="ref47">47</xref>] were conducted using Python (version 3.11.6), SAS Enterprise Guide (version 7.1), and R (version 4.3.2; R Foundation for Statistical Computing).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Characteristics of Cohorts</title><p>The study included 551,934 women (median age 49 years [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]; 10% infected with hrHPV, 1.2% with HPV-16, and 0.6% with HPV-18) in the discovery cohort (<xref ref-type="table" rid="table1">Table 1</xref>) and 47,130 women (median age 37 years [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]; 16.6% with hrHPV, 3.9% with HPV-16, and 1.4% with HPV-18) in the external cohort (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). In the discovery cohort, 9932 were pathologically diagnosed with cervical abnormalities, including 533 with carcinoma. In contrast, the external cohort showed a higher prevalence of cervical abnormalities at 11.1% (5251).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Characteristics by cervical cancer prevention (CCP) subgroups in the discovery cohort. Categorical features are summarized as numbers (percentages), and continuous features as median (Q1, Q3), as appropriate.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">CCP0<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup><break/>(n=542,002)</td><td align="left" valign="bottom">CCP1<break/>(n=2242)</td><td align="left" valign="bottom">CCP2<break/>(n=3770)</td><td align="left" valign="bottom">CCP3<break/>(n=2278)</td><td align="left" valign="bottom">CCP4<break/>(n=1642)</td><td align="left" valign="bottom">Total<break/>(n=551,934)</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), median (Q1, Q3)</td><td align="left" valign="top">48.00 (42.00, 54.00)</td><td align="left" valign="top">48.00 (42.00, 54.00)</td><td align="left" valign="top">48.00 (43.00, 55.00)</td><td align="left" valign="top">51.00 (44.00, 57.00)</td><td align="left" valign="top">48.00 (43.00, 54.00)</td><td align="left" valign="top">49.00 (42.00, 54.00)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Race/ethnicity, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;Han</td><td align="left" valign="top">534,023 (98.53)</td><td align="left" valign="top">2214 (98.75)</td><td align="left" valign="top">3707 (98.33)</td><td align="left" valign="top">2236 (98.16)</td><td align="left" valign="top">1607 (97.87)</td><td align="left" valign="top">543,787 (98.52)</td></tr><tr><td align="left" valign="top">&#x2003;Others</td><td align="left" valign="top">4528 (0.84)</td><td align="left" valign="top">15 (0.67)</td><td align="left" valign="top">30 (0.80)</td><td align="left" valign="top">29 (1.27)</td><td align="left" valign="top">20 (1.22)</td><td align="left" valign="top">4622 (0.84)</td></tr><tr><td align="left" valign="top">&#x2003;Missing</td><td align="left" valign="top">3451 (0.64)</td><td align="left" valign="top">13 (0.58)</td><td align="left" valign="top">33 (0.88)</td><td align="left" valign="top">13 (0.57)</td><td align="left" valign="top">15 (0.91)</td><td align="left" valign="top">3525 (0.64)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>History of cervical cancer screening, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;Missing</td><td align="left" valign="top">234 (0.04)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">2 (0.05)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">236 (0.04)</td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">411,029 (75.84)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">3768 (99.95)</td><td align="left" valign="top">2278 (100.00)</td><td align="left" valign="top">1642 (100.00)</td><td align="left" valign="top">418,717 (75.86)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">130,739 (24.12)</td><td align="left" valign="top">2242 (100.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">132,981 (24.09)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Time of previous screening, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;Missing</td><td align="left" valign="top">785 (0.14)</td><td align="left" valign="top">13 (0.58)</td><td align="left" valign="top">2 (0.05)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">800 (0.14)</td></tr><tr><td align="left" valign="top">&#x2003;No previous screening</td><td align="left" valign="top">411,029 (75.84)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">3768 (99.95)</td><td align="left" valign="top">2278 (100.00)</td><td align="left" valign="top">1642 (100.00)</td><td align="left" valign="top">418,717 (75.86)</td></tr><tr><td align="left" valign="top">&#x2003;Within 3 years from now</td><td align="left" valign="top">65,519 (12.09)</td><td align="left" valign="top">1091 (48.66)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">66,610 (12.07)</td></tr><tr><td align="left" valign="top">&#x2003;More than 3 years ago</td><td align="left" valign="top">64,669 (11.93)</td><td align="left" valign="top">1138 (50.76)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">65,807 (11.92)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Gynecological examination, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;Missing</td><td align="left" valign="top">2180 (0.40)</td><td align="left" valign="top">1 (0.04)</td><td align="left" valign="top">1 (0.03)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">2182 (0.40)</td></tr><tr><td align="left" valign="top">&#x2003;Normal</td><td align="left" valign="top">417,921 (77.11)</td><td align="left" valign="top">1508 (67.26)</td><td align="left" valign="top">3763 (99.81)</td><td align="left" valign="top">1568 (68.83)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">424,760 (76.96)</td></tr><tr><td align="left" valign="top">&#x2003;Abnormal</td><td align="left" valign="top">121,901 (22.49)</td><td align="left" valign="top">733 (32.69)</td><td align="left" valign="top">6 (0.16)</td><td align="left" valign="top">710 (31.17)</td><td align="left" valign="top">1642 (100.00)</td><td align="left" valign="top">124,992 (22.65)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for high-risk HPV</bold><sup><xref ref-type="table-fn" rid="table1fn1">b, c</xref></sup><bold>, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">496,234 (91.56)</td><td align="left" valign="top">99 (4.42)</td><td align="left" valign="top">206 (5.46)</td><td align="left" valign="top">27 (1.19)</td><td align="left" valign="top">67 (4.08)</td><td align="left" valign="top">496,633 (89.98)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">45,768 (8.44)</td><td align="left" valign="top">2143 (95.58)</td><td align="left" valign="top">3564 (94.54)</td><td align="left" valign="top">2251 (98.81)</td><td align="left" valign="top">1575 (95.92)</td><td align="left" valign="top">55,301 (10.02)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for low-risk HPV</bold><sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup><bold>, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">534,313 (98.58)</td><td align="left" valign="top">2035 (90.77)</td><td align="left" valign="top">3664 (97.19)</td><td align="left" valign="top">1813 (79.59)</td><td align="left" valign="top">1602 (97.56)</td><td align="left" valign="top">543,427 (98.46)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">7689 (1.42)</td><td align="left" valign="top">207 (9.23)</td><td align="left" valign="top">106 (2.81)</td><td align="left" valign="top">465 (20.41)</td><td align="left" valign="top">40 (2.44)</td><td align="left" valign="top">8507 (1.54)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for possible high-risk HPV</bold><sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup><bold>, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">537,999 (99.26)</td><td align="left" valign="top">2130 (95.00)</td><td align="left" valign="top">3686 (97.77)</td><td align="left" valign="top">1987 (87.23)</td><td align="left" valign="top">1617 (98.48)</td><td align="left" valign="top">547,419 (99.18)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">4003 (0.74)</td><td align="left" valign="top">112 (5.00)</td><td align="left" valign="top">84 (2.23)</td><td align="left" valign="top">291 (12.77)</td><td align="left" valign="top">25 (1.52)</td><td align="left" valign="top">4515 (0.82)</td></tr><tr><td align="left" valign="top">Number of HPV infections</td><td align="left" valign="top">0.00 (0.00, 0.00)</td><td align="left" valign="top">1.00 (1.00, 2.00)</td><td align="left" valign="top">1.00 (1.00, 1.00)</td><td align="left" valign="top">2.00 (2.00, 3.00)</td><td align="left" valign="top">1.00 (1.00, 1.00)</td><td align="left" valign="top">0.00 (0.00, 0.00)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-16, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">538,375 (99.33)</td><td align="left" valign="top">1684 (75.11)</td><td align="left" valign="top">2745 (72.81)</td><td align="left" valign="top">1494 (65.58)</td><td align="left" valign="top">1199 (73.02)</td><td align="left" valign="top">545,497 (98.83)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">3627 (0.67)</td><td align="left" valign="top">558 (24.89)</td><td align="left" valign="top">1025 (27.19)</td><td align="left" valign="top">784 (34.42)</td><td align="left" valign="top">443 (26.98)</td><td align="left" valign="top">6437 (1.17)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-18, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">539,716 (99.58)</td><td align="left" valign="top">2002 (89.30)</td><td align="left" valign="top">3442 (91.30)</td><td align="left" valign="top">1887 (82.84)</td><td align="left" valign="top">1508 (91.84)</td><td align="left" valign="top">548,555 (99.39)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">2286 (0.42)</td><td align="left" valign="top">240 (10.70)</td><td align="left" valign="top">328 (8.70)</td><td align="left" valign="top">391 (17.16)</td><td align="left" valign="top">134 (8.16)</td><td align="left" valign="top">3379 (0.61)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-31, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,143 (99.66)</td><td align="left" valign="top">2138 (95.36)</td><td align="left" valign="top">3662 (97.14)</td><td align="left" valign="top">2063 (90.56)</td><td align="left" valign="top">1588 (96.71)</td><td align="left" valign="top">549,594 (99.58)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1859 (0.34)</td><td align="left" valign="top">104 (4.64)</td><td align="left" valign="top">108 (2.86)</td><td align="left" valign="top">215 (9.44)</td><td align="left" valign="top">54 (3.29)</td><td align="left" valign="top">2340 (0.42)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-33, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">539,290 (99.50)</td><td align="left" valign="top">2096 (93.49)</td><td align="left" valign="top">3608 (95.70)</td><td align="left" valign="top">1978 (86.83)</td><td align="left" valign="top">1562 (95.13)</td><td align="left" valign="top">548,534 (99.38)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">2712 (0.50)</td><td align="left" valign="top">146 (6.51)</td><td align="left" valign="top">162 (4.30)</td><td align="left" valign="top">300 (13.17)</td><td align="left" valign="top">80 (4.87)</td><td align="left" valign="top">3400 (0.62)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-35, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,820 (99.78)</td><td align="left" valign="top">2197 (97.99)</td><td align="left" valign="top">3708 (98.36)</td><td align="left" valign="top">2160 (94.82)</td><td align="left" valign="top">1622 (98.78)</td><td align="left" valign="top">550,507 (99.74)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1182 (0.22)</td><td align="left" valign="top">45 (2.01)</td><td align="left" valign="top">62 (1.64)</td><td align="left" valign="top">118 (5.18)</td><td align="left" valign="top">20 (1.22)</td><td align="left" valign="top">1427 (0.26)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-39, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">537,675 (99.20)</td><td align="left" valign="top">2092 (93.31)</td><td align="left" valign="top">3638 (96.50)</td><td align="left" valign="top">2021 (88.72)</td><td align="left" valign="top">1600 (97.44)</td><td align="left" valign="top">547,026 (99.11)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">4327 (0.80)</td><td align="left" valign="top">150 (6.69)</td><td align="left" valign="top">132 (3.50)</td><td align="left" valign="top">257 (11.28)</td><td align="left" valign="top">42 (2.56)</td><td align="left" valign="top">4908 (0.89)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-45, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,998 (99.81)</td><td align="left" valign="top">2205 (98.35)</td><td align="left" valign="top">3741 (99.23)</td><td align="left" valign="top">2204 (96.75)</td><td align="left" valign="top">1632 (99.39)</td><td align="left" valign="top">550,780 (99.79)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1004 (0.19)</td><td align="left" valign="top">37 (1.65)</td><td align="left" valign="top">29 (0.77)</td><td align="left" valign="top">74 (3.25)</td><td align="left" valign="top">10 (0.61)</td><td align="left" valign="top">1154 (0.21)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-51, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">537,654 (99.20)</td><td align="left" valign="top">2053 (91.57)</td><td align="left" valign="top">3590 (95.23)</td><td align="left" valign="top">1954 (85.78)</td><td align="left" valign="top">1565 (95.31)</td><td align="left" valign="top">546,816 (99.07)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">4348 (0.80)</td><td align="left" valign="top">189 (8.43)</td><td align="left" valign="top">180 (4.77)</td><td align="left" valign="top">324 (14.22)</td><td align="left" valign="top">77 (4.69)</td><td align="left" valign="top">5118 (0.93)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-52, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">525,904 (97.03)</td><td align="left" valign="top">1622 (72.35)</td><td align="left" valign="top">3019 (80.08)</td><td align="left" valign="top">1396 (61.28)</td><td align="left" valign="top">1276 (77.71)</td><td align="left" valign="top">533,217 (96.61)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">16,098 (2.97)</td><td align="left" valign="top">620 (27.65)</td><td align="left" valign="top">751 (19.92)</td><td align="left" valign="top">882 (38.72)</td><td align="left" valign="top">366 (22.29)</td><td align="left" valign="top">18,717 (3.39)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-56, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">539,439 (99.53)</td><td align="left" valign="top">2133 (95.14)</td><td align="left" valign="top">3682 (97.67)</td><td align="left" valign="top">2076 (91.13)</td><td align="left" valign="top">1610 (98.05)</td><td align="left" valign="top">548,940 (99.46)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">2563 (0.47)</td><td align="left" valign="top">109 (4.86)</td><td align="left" valign="top">88 (2.33)</td><td align="left" valign="top">202 (8.87)</td><td align="left" valign="top">32 (1.95)</td><td align="left" valign="top">2994 (0.54)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-58, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">534,764 (98.66)</td><td align="left" valign="top">1877 (83.72)</td><td align="left" valign="top">3297 (87.45)</td><td align="left" valign="top">1691 (74.23)</td><td align="left" valign="top">1413 (86.05)</td><td align="left" valign="top">543,042 (98.39)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">7238 (1.34)</td><td align="left" valign="top">365 (16.28)</td><td align="left" valign="top">473 (12.55)</td><td align="left" valign="top">587 (25.77)</td><td align="left" valign="top">229 (13.95)</td><td align="left" valign="top">8892 (1.61)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-59, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,034 (99.64)</td><td align="left" valign="top">2180 (97.23)</td><td align="left" valign="top">3710 (98.41)</td><td align="left" valign="top">2124 (93.24)</td><td align="left" valign="top">1620 (98.66)</td><td align="left" valign="top">549,668 (99.59)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1968 (0.36)</td><td align="left" valign="top">62 (2.77)</td><td align="left" valign="top">60 (1.59)</td><td align="left" valign="top">154 (6.76)</td><td align="left" valign="top">22 (1.34)</td><td align="left" valign="top">2266 (0.41)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-66, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,640 (99.75)</td><td align="left" valign="top">2186 (97.50)</td><td align="left" valign="top">3720 (98.67)</td><td align="left" valign="top">2180 (95.70)</td><td align="left" valign="top">1614 (98.29)</td><td align="left" valign="top">550,340 (99.71)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1362 (0.25)</td><td align="left" valign="top">56 (2.50)</td><td align="left" valign="top">50 (1.33)</td><td align="left" valign="top">98 (4.30)</td><td align="left" valign="top">28 (1.71)</td><td align="left" valign="top">1594 (0.29)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-68, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">538,250 (99.31)</td><td align="left" valign="top">2124 (94.74)</td><td align="left" valign="top">3654 (96.92)</td><td align="left" valign="top">2018 (88.59)</td><td align="left" valign="top">1604 (97.69)</td><td align="left" valign="top">547,650 (99.22)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">3752 (0.69)</td><td align="left" valign="top">118 (5.26)</td><td align="left" valign="top">116 (3.08)</td><td align="left" valign="top">260 (11.41)</td><td align="left" valign="top">38 (2.31)</td><td align="left" valign="top">4284 (0.78)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-11, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">541,435 (99.90)</td><td align="left" valign="top">2218 (98.93)</td><td align="left" valign="top">3764 (99.84)</td><td align="left" valign="top">2235 (98.11)</td><td align="left" valign="top">1631 (99.33)</td><td align="left" valign="top">551,283 (99.88)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">567 (0.10)</td><td align="left" valign="top">24 (1.07)</td><td align="left" valign="top">6 (0.16)</td><td align="left" valign="top">43 (1.89)</td><td align="left" valign="top">11 (0.67)</td><td align="left" valign="top">651 (0.12)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-42, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,587 (99.74)</td><td align="left" valign="top">2199 (98.08)</td><td align="left" valign="top">3745 (99.34)</td><td align="left" valign="top">2175 (95.48)</td><td align="left" valign="top">1639 (99.82)</td><td align="left" valign="top">550,345 (99.71)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1415 (0.26)</td><td align="left" valign="top">43 (1.92)</td><td align="left" valign="top">25 (0.66)</td><td align="left" valign="top">103 (4.52)</td><td align="left" valign="top">3 (0.18)</td><td align="left" valign="top">1589 (0.29)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-43, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">541,315 (99.87)</td><td align="left" valign="top">2212 (98.66)</td><td align="left" valign="top">3759 (99.71)</td><td align="left" valign="top">2210 (97.01)</td><td align="left" valign="top">1641 (99.94)</td><td align="left" valign="top">551,137 (99.86)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">687 (0.13)</td><td align="left" valign="top">30 (1.34)</td><td align="left" valign="top">11 (0.29)</td><td align="left" valign="top">68 (2.99)</td><td align="left" valign="top">1 (0.06)</td><td align="left" valign="top">797 (0.14)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-44, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,505 (99.72)</td><td align="left" valign="top">2212 (98.66)</td><td align="left" valign="top">3753 (99.55)</td><td align="left" valign="top">2201 (96.62)</td><td align="left" valign="top">1636 (99.63)</td><td align="left" valign="top">550,307 (99.71)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1497 (0.28)</td><td align="left" valign="top">30 (1.34)</td><td align="left" valign="top">17 (0.45)</td><td align="left" valign="top">77 (3.38)</td><td align="left" valign="top">6 (0.37)</td><td align="left" valign="top">1627 (0.29)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-6, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">540,748 (99.77)</td><td align="left" valign="top">2207 (98.44)</td><td align="left" valign="top">3748 (99.42)</td><td align="left" valign="top">2199 (96.53)</td><td align="left" valign="top">1635 (99.57)</td><td align="left" valign="top">550,537 (99.75)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">1254 (0.23)</td><td align="left" valign="top">35 (1.56)</td><td align="left" valign="top">22 (0.58)</td><td align="left" valign="top">79 (3.47)</td><td align="left" valign="top">7 (0.43)</td><td align="left" valign="top">1397 (0.25)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-81, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">539,354 (99.51)</td><td align="left" valign="top">2178 (97.15)</td><td align="left" valign="top">3747 (99.39)</td><td align="left" valign="top">2136 (93.77)</td><td align="left" valign="top">1632 (99.39)</td><td align="left" valign="top">549,047 (99.48)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">2648 (0.49)</td><td align="left" valign="top">64 (2.85)</td><td align="left" valign="top">23 (0.61)</td><td align="left" valign="top">142 (6.23)</td><td align="left" valign="top">10 (0.61)</td><td align="left" valign="top">2887 (0.52)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Positive for HPV-53, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">538,445 (99.34)</td><td align="left" valign="top">2139 (95.41)</td><td align="left" valign="top">3689 (97.85)</td><td align="left" valign="top">2015 (88.45)</td><td align="left" valign="top">1617 (98.48)</td><td align="left" valign="top">547,905 (99.27)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">3557 (0.66)</td><td align="left" valign="top">103 (4.59)</td><td align="left" valign="top">81 (2.15)</td><td align="left" valign="top">263 (11.55)</td><td align="left" valign="top">25 (1.52)</td><td align="left" valign="top">4029 (0.73)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Cervical cytology examination, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;NILM<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">42,746 (7.89)</td><td align="left" valign="top">489 (21.81)</td><td align="left" valign="top">721 (19.12)</td><td align="left" valign="top">438 (19.23)</td><td align="left" valign="top">345 (21.01)</td><td align="left" valign="top">44,739 (8.11)</td></tr><tr><td align="left" valign="top">&#x2003;No examination due to negative for high-risk HPV</td><td align="left" valign="top">487,235 (89.90)</td><td align="left" valign="top">3 (0.13)</td><td align="left" valign="top">7 (0.19)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">487,245 (88.28)</td></tr><tr><td align="left" valign="top">&#x2003;ASC-US<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">7577 (1.40)</td><td align="left" valign="top">808 (36.04)</td><td align="left" valign="top">1185 (31.43)</td><td align="left" valign="top">721 (31.65)</td><td align="left" valign="top">531 (32.34)</td><td align="left" valign="top">10822 (1.96)</td></tr><tr><td align="left" valign="top">&#x2003;LSIL<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">2245 (0.41)</td><td align="left" valign="top">488 (21.77)</td><td align="left" valign="top">772 (20.48)</td><td align="left" valign="top">546 (23.97)</td><td align="left" valign="top">286 (17.42)</td><td align="left" valign="top">4337 (0.79)</td></tr><tr><td align="left" valign="top">&#x2003;AGC<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td><td align="left" valign="top">99 (0.02)</td><td align="left" valign="top">18 (0.80)</td><td align="left" valign="top">29 (0.77)</td><td align="left" valign="top">13 (0.57)</td><td align="left" valign="top">30 (1.83)</td><td align="left" valign="top">189 (0.03)</td></tr><tr><td align="left" valign="top">&#x2003;Missing but positive for high-risk HPV</td><td align="left" valign="top">779 (0.14)</td><td align="left" valign="top">99 (4.42)</td><td align="left" valign="top">231 (6.13)</td><td align="left" valign="top">159 (6.98)</td><td align="left" valign="top">81 (4.93)</td><td align="left" valign="top">1349 (0.24)</td></tr><tr><td align="left" valign="top">&#x2003;ASC-H<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td><td align="left" valign="top">902 (0.17)</td><td align="left" valign="top">147 (6.56)</td><td align="left" valign="top">363 (9.63)</td><td align="left" valign="top">163 (7.16)</td><td align="left" valign="top">145 (8.83)</td><td align="left" valign="top">1720 (0.31)</td></tr><tr><td align="left" valign="top">&#x2003;AGC-FN<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></td><td align="left" valign="top">7 (0.00)</td><td align="left" valign="top">4 (0.18)</td><td align="left" valign="top">9 (0.24)</td><td align="left" valign="top">3 (0.13)</td><td align="left" valign="top">6 (0.37)</td><td align="left" valign="top">29 (0.01)</td></tr><tr><td align="left" valign="top">&#x2003;HSIL<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="left" valign="top">411 (0.08)</td><td align="left" valign="top">185 (8.25)</td><td align="left" valign="top">443 (11.75)</td><td align="left" valign="top">233 (10.23)</td><td align="left" valign="top">215 (13.09)</td><td align="left" valign="top">1487 (0.27)</td></tr><tr><td align="left" valign="top">&#x2003;Carcinoma</td><td align="left" valign="top">1 (0.00)</td><td align="left" valign="top">1 (0.04)</td><td align="left" valign="top">10 (0.27)</td><td align="left" valign="top">2 (0.09)</td><td align="left" valign="top">3 (0.18)</td><td align="left" valign="top">17 (0.00)</td></tr><tr><td align="left" valign="top" colspan="7"><bold>Histopathological diagnosis, n (%)</bold></td></tr><tr><td align="left" valign="top">&#x2003;NILM</td><td align="left" valign="top">542,002 (100.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">542,002 (98.20)</td></tr><tr><td align="left" valign="top">&#x2003;CIN1<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1542 (68.78)</td><td align="left" valign="top">2456 (65.15)</td><td align="left" valign="top">1445 (63.43)</td><td align="left" valign="top">948 (57.73)</td><td align="left" valign="top">6391 (1.16)</td></tr><tr><td align="left" valign="top">&#x2003;CIN2<sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup></td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">22 (0.98)</td><td align="left" valign="top">29 (0.77)</td><td align="left" valign="top">15 (0.66)</td><td align="left" valign="top">16 (0.97)</td><td align="left" valign="top">82 (0.01)</td></tr><tr><td align="left" valign="top">&#x2003;CIN2/3<sup><xref ref-type="table-fn" rid="table1fn15">o</xref></sup></td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">551 (24.58)</td><td align="left" valign="top">1113 (29.52)</td><td align="left" valign="top">716 (31.43)</td><td align="left" valign="top">485 (29.54)</td><td align="left" valign="top">2865 (0.52)</td></tr><tr><td align="left" valign="top">&#x2003;CIN3<sup><xref ref-type="table-fn" rid="table1fn16">p</xref></sup></td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">16 (0.71)</td><td align="left" valign="top">19 (0.50)</td><td align="left" valign="top">13 (0.57)</td><td align="left" valign="top">13 (0.79)</td><td align="left" valign="top">61 (0.01)</td></tr><tr><td align="left" valign="top">&#x2003;Carcinoma</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">111 (4.95)</td><td align="left" valign="top">153 (4.06)</td><td align="left" valign="top">89 (3.91)</td><td align="left" valign="top">180 (10.96)</td><td align="left" valign="top">533 (0.10)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>CCP: cervical cancer prevention.</p></fn><fn id="table1fn2"><p><sup>b</sup>HPV: human papillomavirus.</p></fn><fn id="table1fn3"><p><sup>c</sup>high-risk HPV: HPV-16/18/31/33/35/39/45/51/52/56/58/59/66/68.</p></fn><fn id="table1fn4"><p><sup>d</sup>low-risk HPV: HPV-11/40/42/43/44/6/61/72/81.</p></fn><fn id="table1fn5"><p><sup>e</sup>possible high-risk HPV: HPV-53/70/73/82/83.</p></fn><fn id="table1fn6"><p><sup>f</sup>NILM: negative for intraepithelial lesion or malignancy.</p></fn><fn id="table1fn7"><p><sup>g</sup>ASC-US: atypical squamous cells of undetermined significance.</p></fn><fn id="table1fn8"><p><sup>h</sup>LSIL: low-grade squamous intraepithelial lesion.</p></fn><fn id="table1fn9"><p><sup>i</sup>AGC: atypical glandular cells.</p></fn><fn id="table1fn10"><p><sup>j</sup>ASC-H: atypical squamous cells, cannot exclude high-grade squamous intraepithelial lesion.</p></fn><fn id="table1fn11"><p><sup>k</sup>AGC-FN: AGC-favor neoplastic.</p></fn><fn id="table1fn12"><p><sup>l</sup>HSIL: high-grade squamous intraepithelial lesion.</p></fn><fn id="table1fn13"><p><sup>m</sup>CIN1: cervical intraepithelial neoplasia grade 1.</p></fn><fn id="table1fn14"><p><sup>n</sup>CIN2: cervical intraepithelial neoplasia grade 2.</p></fn><fn id="table1fn15"><p><sup>o</sup>CIN2/3 is reflective of CIN2 or CIN3, i.e., HSIL; carcinoma consists of AIS (adenocarcinoma in situ) and cancer.</p></fn><fn id="table1fn16"><p><sup>p</sup>CIN3: cervical intraepithelial neoplasia grade 3.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Data-Driven Subgroups</title><p>The discovery cohort was extensively phenotyped based on 31 features (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Visual assessment of the risk phenomaps revealed that nearly all 6 features were heterogeneously distributed in the phenomic space to varying degrees, indicating distinct phenotypic neighborhoods. In the discovery cohort, the CCP subgroups identified across 3 algorithms and all metrics were stable (<xref ref-type="fig" rid="figure3">Figure 3A</xref> and Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), with the optimal number of clusters being 4 in the subpopulation of 9932 women with cervical abnormalities. The distribution of cervical abnormalities across subgroups is presented in <xref ref-type="fig" rid="figure3">Figure 3B</xref>. Additionally, women with normal screening results were treated as another CCP subgroup (<xref ref-type="table" rid="table1">Table 1</xref>). Following a detailed analysis of each subgroup&#x2019;s features, we labeled the 5 identified subgroups as follows: (0) healthy, (1) early onset, (2) screening-targeted, (3) late onset, and (4) carcinoma-specific. CCP1 had the highest prevalence of CIN1, while CCP4 had the highest prevalence of carcinoma (<xref ref-type="fig" rid="figure3">Figure 3C</xref>). Most features were able to discriminate well between the subgroups. In the external cohort, the subgroups were consistent (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), though CCP1 was not identified due to missing information on previous screenings. The distribution of subgroups was similar across the discovery and external cohorts, with CCP0 being the most common subgroup and CCP4 having the highest prevalence of carcinoma.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Manifold representations of the phenotypic architecture of 9932 individuals pathologically diagnosed with cervical abnormality from the discovery cohort (N=551,934). A total of 9932 individuals are embedded in the phenotypic space based on dissimilarity metrics (Gower&#x2019;s distance) derived from 31 included phenotypic features; thus, phenotypically similar women tend to be topologically closer. In the subfigures, each dot represents an individual, with coloring based on the value of features. Since the dimensionality reduction is nonlinear, axes have been omitted, and only the comparisons between distances are meaningful. Pathologically abnormal diagnoses consisted of CIN1, CIN2, CIN3, and carcinoma. 14 high-risk HPV: HPV-16/18/31/33/35/39/45/51/52/56/58/59/66/68; low-risk HPV: HPV-11/40/42/43/44/6/61/72/81; possible high-risk HPV: HPV- 53/70/73/82/83.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e67840_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Determination of the 5 CCP subgroups with differential risks of CIN2+/CIN3+. (<bold>A</bold>) Elbow plot to determine the optimal number of clusters. Across 3 algorithms (k-means, LCA, and UMAP), identified CCP subgroups were stable, with the optimal number of clusters being 4 in 9932 women pathologically diagnosed with cervical abnormality. Women with normal screening test findings were considered as one independent CCP subgroup free of cervical cancer (<xref ref-type="table" rid="table1">Table 1</xref>). (<bold>B</bold>) Relative prevalence of pathologically abnormal diagnoses across CCP subgroups. For each pathologically abnormal diagnosis, the highest prevalence was designated as 100%, and the prevalence in each of the other CCP subgroups was relative to that prevalence (0&#x2010;100). (<bold>C</bold>) Characteristics of CCP subgroups. (<bold>D</bold>) CCP-specific risk estimates of CIN2+/CIN3+ compared with the CCP1 subgroup. Adjusted ORs (dots) and 95% CIs (error bars) are presented. The dashed line marks an OR of 1.00; lower limits of 95% CIs with values greater than 1.00 indicate significantly increased risk. (<bold>E</bold>) The CCP-specific risks of CIN2+/CIN3+ across age compared with the CCP1 subgroup. Age was transformed into a restricted cubic spline function for the analyses. <italic>P</italic> value was based on 2-sided Chi-squared test on the interaction between age and CCP subgroups. A <italic>P</italic> value of &#x003C;.05 suggests that age modifies the association between CCP subgroups and CIN2+/CIN3+. Light-colored bands represent 95% CIs. (<bold>F</bold>) Subgroup analyses of CCP-specific risk estimates of CIN2+/CIN3+ compared with the CCP1 subgroup. Adjusted ORs (dots) and 95% CIs (error bars) are presented. The dashed line marks an OR of 1.00; lower limits of 95% CIs with values greater than 1.00 indicate significantly increased risk. Empty subfigures suggest insufficient samples for the analysis. AIC: Akaike information criterion; BIC: Bayesian information criterion; SABIC: sample size-adjusted BIC; CCP: cervical cancer prevention; CIN1: cervical intraepithelial neoplasia grade 1; CIN2: cervical intraepithelial neoplasia grade 2; CIN3: cervical intraepithelial neoplasia grade 3; CIN2+: cervical intraepithelial neoplasia grade 2 or worse; CIN3+: cervical intraepithelial neoplasia grade 3 or worse; OR: odds ratio; hrHPV: high-risk human papillomavirus.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e67840_fig03.png"/></fig></sec><sec id="s3-3"><title>Risk Estimates and Diagnostic Validity</title><p>In the diagnostic validity analysis of the discovery cohort (<xref ref-type="fig" rid="figure3">Figure 3D</xref>), women in CCP2-4 exhibited a significantly increased risk of both CIN2+ (CCP2: OR 2.07, 95% CI [2.03&#x2010;2.12]; CCP3: 3.88 [3.78&#x2010;3.97]; CCP4: 4.47 [4.33&#x2010;4.63]) and CIN3+ (2.10 [2.05&#x2010;2.14]; 3.92 [3.82&#x2010;4.02]; 4.45 [4.31&#x2010;4.61]) compared to CCP1. Risk analysis across age groups showed that the risks for CIN2+/CIN3+ were evident in the age ranges of 34&#x2010;47 and 60&#x2010;65 in CCP2, 26&#x2010;61 in CCP3, and 35&#x2010;60 in CCP4, respectively (<xref ref-type="fig" rid="figure3">Figure 3E</xref>). Interaction analyses between age and subgroups revealed that the risks of CIN2+/CIN3+ increased with age in the 34&#x2010;39 and 60&#x2010;65 age ranges in CCP2, in the 35-43/44 age range in CCP4. Conversely, the risks decreased with age in CCP2 within the 40&#x2010;47 age range and in CCP4 within the 45&#x2010;60 age range (all <italic>P</italic> for interaction &#x003C;.001). Subgroup analyses indicated that the risks for CIN2+/CIN3+ were present across nearly all subgroups, categorized by age, race, gynecological examination, screening history, hrHPV infection, and number of infections (<xref ref-type="fig" rid="figure3">Figure 3F</xref> and Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>SHAP analysis identified the top 10 key features for prediction, including the number of infections, screening history, gynecological examination, hrHPV infection, cervical cytology, time since previous screening, HPV-16/18 infection, age, and possible hrHPV infection (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). The final XGBoost model demonstrated excellent discrimination (OVR AUROC 0.995 [0.994&#x2010;0.996]), with CCP0 showing the lowest AUROC of 0.987 [0.985&#x2010;0.989], and strong calibration (Brier score 0.021 [0.020&#x2010;0.022]) (<xref ref-type="fig" rid="figure4">Figure 4B&#x2013;C</xref> and Table S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For the external diagnostic validity of the identified subgroups, women in CCP2-4 showed differential and increased risk for both CIN2+ (CCP2: 5.54 [3.27&#x2010;8.86]; CCP3&#x0026;4: 26.56 [24.44&#x2010;28.88]) and CIN3+ (7.53 [3.90&#x2010;13.18]; 29.47 [26.46&#x2010;32.86]) compared to CCP0. The cross-cluster risk differences were consistent across the discovery and external cohorts. To illustrate the model&#x2019;s explainability, <xref ref-type="fig" rid="figure4">Figure 4D</xref> presents the SHAP plot for a woman in the CCP4 subgroup, who had no previous screening and tested positive for HPV-16 and CIN1 based on cervical cytology. Given this information, our model predicted an elevated risk of CCP4. Additionally, a screenshot of our browser-accessible tool based on the model developed in this study, to clarify how the model can be easily accessed via a browser in clinical settings, is shown in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Feature importance, discrimination, calibration, explainability, and external diagnostic validity. (<bold>A</bold>) The top 20 features for prediction of CCP subgroups with differential risks of CIN2+/CIN3+ are shown. The y-axis represents the features included in the model development (in descending order of importance), and the x-axis indicates the mean of SHAP values. The 10 most important features were selected to train the final parsimonious model. (<bold>B</bold>) ROC curves in the internal validation from the discovery cohort. The dark purple line represents the macro-average of all 5 CCP subgroups. (<bold>C</bold>) Calibration curve of the alignment between predicted and observed CCP subgroups for the final model. The solid line corresponds to the calibration curve, with the dashed line corresponding to a reference for perfect calibration (ie, perfect alignment between the predicted and observed probabilities). (<bold>D</bold>) Explanation of the SCREENing tool (ie, the inference process of the final model with a woman in the CCP4 subgroup). (<bold>E</bold>) In external validation, to assess cross-cluster and cross-dataset risk differences, the model was measured and compared by diagnostic validity (CCP-specific ORs) between datasets. CCP: cervical cancer prevention; hrHPV: high-risk human papillomavirus; lrHPV: low-risk human papillomavirus; SHAP: SHapley Additive exPlanations; AUC: area under receiver operating characteristics curve; XGBoost: eXtreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="publichealth_v11i1e67840_fig04.png"/></fig></sec><sec id="s3-4"><title>Developed Pathways</title><p>Based on our analyses, we proposed a triple SCREENing strategy to prioritize CCP subgroups with varying CIN2+/CIN3+ risks: (1) top priority for colposcopy referrals to women in CCP3-4 in resource-constrained settings, (2) higher priority given for scaling up organized, population-based HPV screening programs (with adequate follow-up) for women in CCP1-2, and (3) lowest priority for CCP0 women, with large-scale screening limited to resource-rich settings. To assess its impact, we evaluated the real-world usability and effectiveness of SCREENing. Sample clinicians reported that the identified subgroups and included features were clinically relevant for risk-based cervical cancer management, particularly for colposcopy referrals in CCP3-4. They also found the strategy transparent, interpretable, and generalizable across clinical settings, with the browser-accessible model feasible and effective for indicating risk probabilities during consultations. Sample epidemiologists highlighted the strategy&#x2019;s potential to advance screening practices, public health policies, and trial design by enabling phenomapping, estimating subgroup-specific risk profiles, and establishing high-performance, cost-effective CCP for resource-limited regions. They noted its capability for testing effectiveness and cost-effectiveness in well-designed, prospective studies.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>This study represents one of the largest EHR analyses to date, employing diverse machine learning methods and robust validation approaches to classify subgroups and predict CIN2+/CIN3+ risk. By leveraging comprehensive and interconnected phenotypic features, our study identified 5 CCP subgroups with varying risks. CCP2&#x2013;4 had significantly higher risks of CIN2+ (CCP2: OR 2.07 [95% CI: 2.03&#x2010;2.12], CCP3: 3.88 [3.78&#x2010;3.97], CCP4: 4.47 [4.33&#x2010;4.63]) and CIN3+ (CCP2: 2.10 [2.05&#x2010;2.14], CCP3: 3.92 [3.82&#x2010;4.02], CCP4: 4.45 [4.31&#x2010;4.61]) compared to CCP1 (<italic>P</italic>&#x003C;.001), consistent with the direction of results observed in the external cohort. Our findings offer a robust foundation for the proposed triple SCREENing strategy. This tailored approach prioritizes high-risk subgroups, providing actionable insights for cervical cancer prevention, particularly in LMICs.</p><p>To this end, various approaches, including single-cell transcriptomic analysis [<xref ref-type="bibr" rid="ref49">49</xref>], sequence and phylogenetic analysis [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>], and cluster analysis [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref54">54</xref>], have been employed to define genetic and cellular heterogeneity [<xref ref-type="bibr" rid="ref55">55</xref>] in cervical cancer. These studies suggest that distinct subpopulations exhibit heterogeneous risk effects, linking individual features to varying absolute cervical cancer risk. Our 5 CCP subgroups align with findings from 2 major population-based clustering studies [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]. One study used a Poisson regression&#x2013;based CEM clustering algorithm [<xref ref-type="bibr" rid="ref56">56</xref>] to identify clusters of Indian states with similar cervical cancer incidence patterns. However, due to its focus on approximating missing data on sexual behavior, HPV prevalence, or cervical cancer incidence [<xref ref-type="bibr" rid="ref56">56</xref>], the clusters were not ideal for screening purposes. That study did not provide sufficient details to estimate cluster-specific risks, and its reliance on features not typically available in routine screening limited real-world applicability. Additionally, strict model assumptions and the inclusion of relatively few features further constrained its generalizability. Another study performed hierarchical clustering of HPV-related methylation sites to identify subgroups of patients with cervical cancer [<xref ref-type="bibr" rid="ref57">57</xref>]. While informative for prognosis and clinical management, the 3 clusters were not designed for cervical cancer screening. Instead, they are more suitable for guiding prognosis assessment, refining risk stratification, and optimizing treatment strategies in clinical practice.</p><p>In contrast, our study, specifically designed for cervical cancer screening, identified complex interactions among factors such as the number of infections, screening history, gynecological examination, hrHPV and HPV-16/18 infections, cervical cytology, time since previous screening, age, and possible hrHPV infection as key determinants of the 5 CCP subgroups with varying CIN2+/CIN3+ risks. Compared to previous studies [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>], our design and identified subgroups are more representative of real-world cervical cancer screening. Leveraging the comprehensive and interconnected phenotypic features from EHRs, our algorithm extracted CCP-specific risk estimates, providing a robust foundation for the proposed triple SCREENing strategy. This strategy prioritizes subgroups with differential CIN2+/CIN3+ risks, offering a tailored approach to CCP. We recommend implementing SCREENing as a supplemental tool to existing guidelines [<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>], while accounting for the unique priorities and constraints of LMICs. SCREENing enables clinicians to perform effective, risk-based screening, followed by adequate diagnosis, surveillance, and management, while empowering policy makers to optimize public health policies and resource allocation. This approach has the potential to mitigate resource shortages in LMICs, reduce delays in diagnosis and treatment, and enhance screening efficiency by focusing efforts on high-risk populations, ultimately maximizing population-level benefits. Additionally, our analysis highlights the modifying effect of age on CCP-specific CIN2+/CIN3+ risks, emphasizing the need for greater attention to menopause and age [<xref ref-type="bibr" rid="ref61">61</xref>] in cervical cancer screening strategies.</p><p>Methodologically, our study advances the external validation of machine learning algorithms for identifying subgroups and predicting cervical precancer or cancer risk using large-scale routine EHRs&#x2014;a rarity in previous studies, which have often been limited to small samples. Our robust, structured framework of internal, external, and diagnostic validation enhances the acceptability and generalizability of unsupervised and supervised machine learning approaches in routine CCP and is adaptable to other diseases. The identified subgroups demonstrated good accuracy and diagnostic validity for CIN2+/CIN3+ both within and across datasets, though performance was lower in scenarios with missing key features. Differences in diagnostic validity across datasets may reflect variations in HPV infection patterns and previous screening histories, which influence the distribution of risk factors. Our findings of 5 subgroups and the proposed strategy are novel, offering a framework for assessing validity in screening, follow-up surveillance, and treatment for cervical cancer. This study signals the potential for more effective and targeted approaches to CCP.</p><p>This study represents one of the largest EHR analyses to date, employing multiple machine learning methods, datasets, and validation approaches to classify subgroups and predict CIN2+/CIN3+ risk. However, there are several limitations. First, a major limitation of this study is that our models were not externally validated beyond China. HPV infection patterns and the epidemiology of cervical abnormalities differ across countries and regions, which may impact the generalizability of our models. Given this variability, and although we used data from 5 distinct regions within China, we strongly recommend further validation of our models&#x2019; performance before applying them in settings not included in this study. We acknowledge that externally validating the model in additional multicenter studies worldwide is crucial for assessing its transferability and applicability across different clinical settings. Additionally, the tool may face challenges in fully adapting to various real-world scenarios when implemented outside the controlled validation environment of this study. To address these concerns, we plan to conduct independent external and prospective validations, as well as pilot implementation across diverse clinical settings in future studies. These efforts will evaluate the model&#x2019;s effectiveness using a wider range of data, particularly in the context of real-world cervical cancer prevention across regions beyond those included in this study. We also encourage independent researchers to validate our model in their own settings, where feasible. While this study marks a significant step in the development of the SCREENing tool, we acknowledge that further research and validation are necessary to establish its effectiveness in real-world applications.</p><p>Second, we acknowledge that the use of retrospective EHR data may introduce biases and may not fully capture the real-time challenges of clinical practice. These challenges include issues such as missing data, data errors, and the heterogeneity of EHR systems across different settings. Although we made efforts to control for the quality of the EHR data, it remains inherently difficult to fully address these concerns without significant infrastructure changes, as well as ongoing monitoring and data validation. Therefore, we explicitly caution that the findings of this study should be interpreted with caution. In light of this limitation, future studies should aim to bridge the gap between retrospective analyses and the practical challenges of data collection in clinical settings. Third, while this study focused on routine EHR data, we acknowledge that incorporating multi-omics data&#x2014;such as genomic, proteomic, and imaging data&#x2014;could further enhance the model&#x2019;s robustness and performance, providing valuable new insights into cervical abnormalities. We propose this as an area for future research to better understand the progression of cervical cancer and to offer novel perspectives on controlling and eliminating cervical cancer. Fourth, due to the limitations of routinely collected EHR content, we were unable to include several key sexual behavior features, such as the number of sexual partners and oral contraceptive use [<xref ref-type="bibr" rid="ref62">62</xref>], in our analyses. These factors are known to significantly influence HPV infection and cervical cancer risk. While the model in this study demonstrated high performance, the absence of such data constrained our ability to further analyze the impact of sexual behaviors on findings, such as subgroup characterization, which could provide valuable insights. We recommend that future studies incorporate these data to validate our findings and offer a more comprehensive understanding of this field.</p><p>In conclusion, this study underscores the potential of leveraging machine learning algorithms and large-scale routine EHRs to enhance cervical cancer prevention strategies. By identifying key determinants of CIN2+/CIN3+ risk and classifying 5 distinct subgroups, our study provides a robust, data-driven foundation for the proposed triple SCREENing strategy. This approach prioritizes tailored prevention efforts for subgroups with varying risks, offering a novel and scalable tool to complement existing cervical cancer screening guidelines. Future work should focus on independent external and prospective validation to maximize the global impact of this strategy.</p></sec></body><back><ack><p>We thank all the contributors for their efforts in this study. We also thank all funding sources for their funding. This research was funded by Fujian Province's Third Batch of Flexible Introduction of High-Level Medical Talent Teams (TD202307), Merck Investigator Studies Program [100073, 59484], National Natural Science Foundation of China (82271658), Major Scientific Research Program for Young and Middle-aged Health Professionals of Fujian Province, China (2021ZQNZD011), Fujian Province Central Government-Guided Local Science and Technology Development Project (2023L3019), Fujian Provincial Health Technology Project (2024GGA061), and Fujian Provincial Science and Technology Innovation Joint Fund (2021Y9171).</p><p/></ack><notes><sec><title>Data Availability</title><p>The data that support the findings of this study are available from the corresponding authors upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>ZL conceived and designed the study in consultation with HZ. ZL analyzed the data and interpreted the results. ZL drafted the manuscript with all authors (BD, HC, TT, JW, LF, BW, WZ, TY, XT, JW, SL, XH, ZZ, HX, SX, SL, PS, and HZ) critically reviewing the manuscript. HZ and SL provided administrative and material support, as well as supervision and mentorship.</p><p>Each author contributed important intellectual content during drafting or revision of the manuscript and accepts accountability for the overall work by ensuring that questions pertaining to the accuracy or integrity of any portion of the work are appropriately investigated and resolved.</p><p>All authors had access to all the data in this study and approved the final version of the manuscript. The corresponding authors attests that all the listed authors meet the authorship criteria and that no others meeting the criteria have been omitted. We confirm that no generative AI tools, such as ChatGPT or other language models, were used in the writing or preparation of this manuscript.</p><p>S Liu, PS, and HZ are co-corresponding authors.</p><p>The complete address for the three co-corresponding authors are as follows:</p><p>S Liu: West Building 1 Medical Garden 4th floor, Gongchang Road 66, Sun Yat-sen University (Shenzhen Campus) Shenzhen, Guangming District, 518107, China; liusy99@mail.sysu.edu.cn (SL); +86 135 4329 6396.</p><p>PS: 18 Daoshan Road, Fuzhou 350001, Fujian, P.R. China (Phone: +86-591-87558732; Fax: +86-591-87551247; email: fmsun1975@fjmu.edu.cn).</p><p>HZ: Room 435, Bld #8, 130 Dongan Road, Xuhui District, Shanghai (200032), China; zouhuachun@fudan.edu.cn (HZ); +86 21 5423 7707.</p><p>ZL, BD, HC, TT, and Junfeng Wang are co-first authors.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CCP</term><def><p>cervical cancer prevention</p></def></def-item><def-item><term id="abb2">CIN</term><def><p>cervical intraepithelial neoplasia</p></def></def-item><def-item><term id="abb3">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb4">HPV</term><def><p>human papillomavirus</p></def></def-item><def-item><term id="abb5">hrHPV</term><def><p>high-risk HPV</p></def></def-item><def-item><term id="abb6">LMIC</term><def><p>low- and middle-income country</p></def></def-item><def-item><term id="abb7">OR</term><def><p>odds ratio</p></def></def-item><def-item><term id="abb8">OVR AUROC</term><def><p>one-versus-rest area under the receiver operating characteristics curve</p></def></def-item><def-item><term id="abb9">SCREENing</term><def><p>clinical Subgroups for CeRvical cancEr prEvention using computational pheNomaps and machine learnING</p></def></def-item><def-item><term id="abb10">SHAP</term><def><p>SHapley Additive exPlanations</p></def></def-item><def-item><term id="abb11">UMAP</term><def><p>uniform manifold approximation and projection</p></def></def-item><def-item><term id="abb12">WHO</term><def><p>World Health Organization</p></def></def-item><def-item><term id="abb13">XGBoost</term><def><p>eXtreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bray</surname><given-names>F</given-names> </name><name name-style="western"><surname>Laversanne</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title><source>CA Cancer J Clin</source><year>2024</year><volume>74</volume><issue>3</issue><fpage>229</fpage><lpage>263</lpage><pub-id pub-id-type="doi">10.3322/caac.21834</pub-id><pub-id pub-id-type="medline">38572751</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>YY</given-names> </name><name name-style="western"><surname>Su</surname><given-names>SY</given-names> </name><etal/></person-group><article-title>Projected time for the elimination of cervical cancer under various intervention scenarios: age-period-cohort macrosimulation study</article-title><source>JMIR Public Health Surveill</source><year>2024</year><month>04</month><day>18</day><volume>10</volume><fpage>e46360</fpage><pub-id pub-id-type="doi">10.2196/46360</pub-id><pub-id pub-id-type="medline">38635315</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lama</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jamison</surname><given-names>A</given-names> </name><name name-style="western"><surname>Quinn</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Broniatowski</surname><given-names>DA</given-names> </name></person-group><article-title>Characterizing trends in human papillomavirus vaccine discourse on Reddit (2007-2015): an observational study</article-title><source>JMIR Public Health Surveill</source><year>2019</year><month>03</month><day>27</day><volume>5</volume><issue>1</issue><fpage>e12480</fpage><pub-id pub-id-type="doi">10.2196/12480</pub-id><pub-id pub-id-type="medline">30916662</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Walboomers</surname><given-names>JMM</given-names> </name><name name-style="western"><surname>Jacobs</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Manos</surname><given-names>MM</given-names> </name><etal/></person-group><article-title>Human papillomavirus is a necessary cause of invasive cervical cancer worldwide</article-title><source>J Pathol</source><year>1999</year><month>09</month><volume>189</volume><issue>1</issue><fpage>12</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1002/(SICI)1096-9896(199909)189:1&#x003C;12::AID-PATH431&#x003E;3.0.CO;2-F</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>X</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Prognostic prediction models for oropharyngeal squamous cell carcinoma (OPSCC): a protocol for systematic review, critical appraisal and meta-analysis</article-title><source>BMJ Open</source><year>2023</year><month>10</month><day>12</day><volume>13</volume><issue>10</issue><fpage>e073375</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2023-073375</pub-id><pub-id pub-id-type="medline">37827742</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>SP</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>XY</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>CF</given-names> </name></person-group><article-title>The prognostic and predictive effects of human papillomavirus status in hypopharyngeal carcinoma: population-based study</article-title><source>JMIR Public Health Surveill</source><year>2022</year><month>12</month><day>16</day><volume>8</volume><issue>12</issue><fpage>e40185</fpage><pub-id pub-id-type="doi">10.2196/40185</pub-id><pub-id pub-id-type="medline">36525304</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Bian</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>H</given-names> </name></person-group><article-title>Association between chronic viral infection-related hospitalization and risk of cardiovascular disease: a population-based cohort study</article-title><source>J Med Virol</source><year>2024</year><month>01</month><volume>96</volume><issue>1</issue><fpage>e29350</fpage><pub-id pub-id-type="doi">10.1002/jmv.29350</pub-id><pub-id pub-id-type="medline">38180233</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>WHO</collab></person-group><source>Global strategy to accelerate the elimination of cervical cancer as a public health problem</source><year>2020</year><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/9789240014107">https://www.who.int/publications/i/item/9789240014107</ext-link></comment></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bruni</surname><given-names>L</given-names> </name><name name-style="western"><surname>Serrano</surname><given-names>B</given-names> </name><name name-style="western"><surname>Roura</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Cervical cancer screening programmes and age-specific coverage estimates for 202 countries and territories worldwide: a review and synthetic analysis</article-title><source>Lancet Glob Health</source><year>2022</year><month>08</month><volume>10</volume><issue>8</issue><fpage>e1115</fpage><lpage>e1127</lpage><pub-id pub-id-type="doi">10.1016/S2214-109X(22)00241-8</pub-id><pub-id pub-id-type="medline">35839811</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gravitt</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Silver</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Hussey</surname><given-names>HM</given-names> </name><etal/></person-group><article-title>Achieving equity in cervical cancer screening in low- and middle-income countries (LMICs): strengthening health systems using a systems thinking approach</article-title><source>Prev Med</source><year>2021</year><month>03</month><volume>144</volume><fpage>106322</fpage><pub-id pub-id-type="doi">10.1016/j.ypmed.2020.106322</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arbyn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Simon</surname><given-names>M</given-names> </name><name name-style="western"><surname>Peeters</surname><given-names>E</given-names> </name><etal/></person-group><article-title>2020 list of human papillomavirus assays suitable for primary cervical cancer screening</article-title><source>Clin Microbiol Infect</source><year>2021</year><month>08</month><volume>27</volume><issue>8</issue><fpage>1083</fpage><lpage>1095</lpage><pub-id pub-id-type="doi">10.1016/j.cmi.2021.04.031</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Poljak</surname><given-names>M</given-names> </name><name name-style="western"><surname>O&#x0161;trbenk Valen&#x010D;ak</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gimpelj Domjani&#x010D;</surname><given-names>G</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Arbyn</surname><given-names>M</given-names> </name></person-group><article-title>Commercially available molecular tests for human papillomaviruses: a global overview</article-title><source>Clin Microbiol Infect</source><year>2020</year><month>09</month><volume>26</volume><issue>9</issue><fpage>1144</fpage><lpage>1150</lpage><pub-id pub-id-type="doi">10.1016/j.cmi.2020.03.033</pub-id><pub-id pub-id-type="medline">32247892</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arbyn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Verdoodt</surname><given-names>F</given-names> </name><name name-style="western"><surname>Snijders</surname><given-names>PJF</given-names> </name><etal/></person-group><article-title>Accuracy of human papillomavirus testing on self-collected versus clinician-collected samples: a meta-analysis</article-title><source>Lancet Oncol</source><year>2014</year><month>02</month><volume>15</volume><issue>2</issue><fpage>172</fpage><lpage>183</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(13)70570-9</pub-id><pub-id pub-id-type="medline">24433684</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mezei</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Armstrong</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Pedersen</surname><given-names>HN</given-names> </name><etal/></person-group><article-title>Cost-effectiveness of cervical cancer screening methods in low- and middle-income countries: a systematic review</article-title><source>Int J Cancer</source><year>2017</year><month>08</month><day>1</day><volume>141</volume><issue>3</issue><fpage>437</fpage><lpage>446</lpage><pub-id pub-id-type="doi">10.1002/ijc.30695</pub-id><pub-id pub-id-type="medline">28297074</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Camara</surname><given-names>H</given-names> </name><name name-style="western"><surname>Nosi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Munnull</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Women&#x2019;s acceptability of a self-collect HPV same-day screen-and-treat program in a high burden setting in the Pacific</article-title><source>BMC Health Serv Res</source><year>2022</year><month>12</month><day>12</day><volume>22</volume><issue>1</issue><fpage>1514</fpage><pub-id pub-id-type="doi">10.1186/s12913-022-08842-1</pub-id><pub-id pub-id-type="medline">36510192</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ronco</surname><given-names>G</given-names> </name><name name-style="western"><surname>Dillner</surname><given-names>J</given-names> </name><name name-style="western"><surname>Elfstr&#x00F6;m</surname><given-names>KM</given-names> </name><etal/></person-group><article-title>Efficacy of HPV-based screening for prevention of invasive cervical cancer: follow-up of four European randomised controlled trials</article-title><source>The Lancet</source><year>2014</year><month>02</month><volume>383</volume><issue>9916</issue><fpage>524</fpage><lpage>532</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(13)62218-7</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arbyn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ronco</surname><given-names>G</given-names> </name><name name-style="western"><surname>Anttila</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Evidence regarding human papillomavirus testing in secondary prevention of cervical cancer</article-title><source>Vaccine (Auckl)</source><year>2012</year><month>11</month><day>20</day><volume>30 Suppl 5</volume><fpage>F88</fpage><lpage>99</lpage><pub-id pub-id-type="doi">10.1016/j.vaccine.2012.06.095</pub-id><pub-id pub-id-type="medline">23199969</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bouvard</surname><given-names>V</given-names> </name><name name-style="western"><surname>Wentzensen</surname><given-names>N</given-names> </name><name name-style="western"><surname>Mackie</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The IARC perspective on cervical cancer screening</article-title><source>N Engl J Med</source><year>2021</year><month>11</month><day>11</day><volume>385</volume><issue>20</issue><fpage>1908</fpage><lpage>1918</lpage><pub-id pub-id-type="doi">10.1056/NEJMsr2030640</pub-id><pub-id pub-id-type="medline">34758259</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>WHO</collab></person-group><source>Guidelines for screening and treatment of precancerous lesions for cervical cancer prevention</source><year>2021</year><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/9789240030824">https://www.who.int/publications/i/item/9789240030824</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mungo</surname><given-names>C</given-names> </name><name name-style="western"><surname>Guliam</surname><given-names>A</given-names> </name><name name-style="western"><surname>Chinula</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Comparison of the ScreenFire and Xpert HPV assays for the detection of human papillomavirus and cervical precancer among women living with HIV in Malawi</article-title><source>medRxiv</source><year>2024</year><month>02</month><day>23</day><fpage>2024.02.21.24303142</fpage><pub-id pub-id-type="doi">10.1101/2024.02.21.24303142</pub-id><pub-id pub-id-type="medline">38617305</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="report"><person-group person-group-type="author"><collab>WHO</collab></person-group><article-title>Comprehensive cervical cancer control: a guide to essential practice</article-title><year>2014</year></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheung</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Egemen</surname><given-names>D</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><etal/></person-group><article-title>2019 ASCCP risk-based management consensus guidelines: methods for risk estimation, recommended management, and validation</article-title><source>J Low Genit Tract Dis</source><year>2020</year><month>04</month><volume>24</volume><issue>2</issue><fpage>90</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1097/LGT.0000000000000528</pub-id><pub-id pub-id-type="medline">32243306</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Weng</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Diagnosis of neurosyphilis in HIV-negative patients with syphilis: development, validation, and clinical utility of a suite of machine learning models</article-title><source>EClinicalMedicine</source><year>2023</year><month>08</month><volume>62</volume><fpage>102080</fpage><pub-id pub-id-type="doi">10.1016/j.eclinm.2023.102080</pub-id><pub-id pub-id-type="medline">37533423</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oikonomou</surname><given-names>EK</given-names> </name><name name-style="western"><surname>Spatz</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Suchard</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Khera</surname><given-names>R</given-names> </name></person-group><article-title>Individualising intensive systolic blood pressure reduction in hypertension using computational trial phenomaps and machine learning: a post-hoc analysis of randomised clinical trials</article-title><source>Lancet Digit Health</source><year>2022</year><month>11</month><volume>4</volume><issue>11</issue><fpage>e796</fpage><lpage>e805</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(22)00170-4</pub-id><pub-id pub-id-type="medline">36307193</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Melnikow</surname><given-names>J</given-names> </name><name name-style="western"><surname>Henderson</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Burda</surname><given-names>BU</given-names> </name><name name-style="western"><surname>Senger</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Durbin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Weyrich</surname><given-names>MS</given-names> </name></person-group><article-title>Screening for cervical cancer with high-risk human papillomavirus testing: updated evidence report and systematic review for the US Preventive Services Task Force</article-title><source>J Am Med Assoc</source><year>2018</year><month>08</month><day>21</day><volume>320</volume><issue>7</issue><fpage>687</fpage><lpage>705</lpage><pub-id pub-id-type="doi">10.1001/jama.2018.10400</pub-id><pub-id pub-id-type="medline">30140883</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xiao</surname><given-names>T</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Use of virus genotypes in machine learning diagnostic prediction models for cervical cancer in women with high-risk human papillomavirus infection</article-title><source>JAMA Netw Open</source><year>2023</year><month>08</month><day>1</day><volume>6</volume><issue>8</issue><fpage>e2326890</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.26890</pub-id><pub-id pub-id-type="medline">37531108</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Waal</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bekkers</surname><given-names>RLM</given-names> </name><name name-style="western"><surname>Dick</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Risk prediction of cervical abnormalities: the value of sociodemographic and lifestyle factors in addition to HPV status</article-title><source>Prev Med</source><year>2020</year><month>01</month><volume>130</volume><fpage>105927</fpage><pub-id pub-id-type="doi">10.1016/j.ypmed.2019.105927</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rothberg</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lipold</surname><given-names>L</given-names> </name><etal/></person-group><article-title>A risk prediction model to allow personalized screening for cervical cancer</article-title><source>Cancer Causes Control</source><year>2018</year><month>03</month><volume>29</volume><issue>3</issue><fpage>297</fpage><lpage>304</lpage><pub-id pub-id-type="doi">10.1007/s10552-018-1013-4</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Li</surname><given-names>RN</given-names> </name><etal/></person-group><article-title>Risk evaluation for the development of cervical intraepithelial neoplasia: development and validation of risk-scoring schemes</article-title><source>Int J Cancer</source><year>2015</year><month>01</month><day>15</day><volume>136</volume><issue>2</issue><fpage>340</fpage><lpage>349</lpage><pub-id pub-id-type="doi">10.1002/ijc.28982</pub-id><pub-id pub-id-type="medline">24841989</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bouvard</surname><given-names>V</given-names> </name><name name-style="western"><surname>Baan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Straif</surname><given-names>K</given-names> </name><etal/></person-group><article-title>A review of human carcinogens--Part B: biological agents</article-title><source>Lancet Oncol</source><year>2009</year><month>04</month><volume>10</volume><issue>4</issue><fpage>321</fpage><lpage>322</lpage><pub-id pub-id-type="doi">10.1016/s1470-2045(09)70096-8</pub-id><pub-id pub-id-type="medline">19350698</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schreiberhuber</surname><given-names>L</given-names> </name><name name-style="western"><surname>Barrett</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Cervical cancer screening using DNA methylation triage in a real-world population</article-title><source>Nat Med</source><year>2024</year><month>08</month><volume>30</volume><issue>8</issue><fpage>2251</fpage><lpage>2257</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-03014-6</pub-id><pub-id pub-id-type="medline">38834848</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marcus</surname><given-names>JZ</given-names> </name><name name-style="western"><surname>Cason</surname><given-names>P</given-names> </name><name name-style="western"><surname>Downs</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Einstein</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Flowers</surname><given-names>L</given-names> </name></person-group><article-title>The ASCCP Cervical Cancer Screening Task Force Endorsement and Opinion on the American Cancer Society updated cervical cancer screening guidelines</article-title><source>J Low Genit Tract Dis</source><year>2021</year><month>07</month><day>1</day><volume>25</volume><issue>3</issue><fpage>187</fpage><lpage>191</lpage><pub-id pub-id-type="doi">10.1097/LGT.0000000000000614</pub-id><pub-id pub-id-type="medline">34138787</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moy</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>FH</given-names> </name><name name-style="western"><surname>Li</surname><given-names>LY</given-names> </name><etal/></person-group><article-title>Human papillomavirus testing and cervical cytology in primary screening for cervical cancer among women in rural China: comparison of sensitivity, specificity, and frequency of referral</article-title><source>Int J Cancer</source><year>2010</year><month>08</month><day>1</day><volume>127</volume><issue>3</issue><fpage>646</fpage><lpage>656</lpage><pub-id pub-id-type="doi">10.1002/ijc.25071</pub-id><pub-id pub-id-type="medline">19960441</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saslow</surname><given-names>D</given-names> </name><name name-style="western"><surname>Solomon</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lawson</surname><given-names>HW</given-names> </name><etal/></person-group><article-title>American Cancer Society, American Society for Colposcopy and Cervical Pathology, and American Society for Clinical Pathology screening guidelines for the prevention and early detection of cervical cancer</article-title><source>Am J Clin Pathol</source><year>2012</year><month>04</month><volume>137</volume><issue>4</issue><fpage>516</fpage><lpage>542</lpage><pub-id pub-id-type="doi">10.1309/AJCPTGD94EVRSJCG</pub-id><pub-id pub-id-type="medline">22431528</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gower</surname><given-names>JC</given-names> </name></person-group><article-title>A general coefficient of similarity and some of its properties</article-title><source>Biometrics</source><year>1971</year><month>12</month><volume>27</volume><issue>4</issue><fpage>857</fpage><pub-id pub-id-type="doi">10.2307/2528823</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>McInnes</surname><given-names>L</given-names> </name><name name-style="western"><surname>Healy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Saul</surname><given-names>N</given-names> </name><name name-style="western"><surname>Gro&#x00DF;berger</surname><given-names>L</given-names> </name></person-group><article-title>UMAP: uniform manifold approximation and projection</article-title><source>arXiv</source><comment>Preprint posted online on 2018</comment><comment>arXiv:180203426</comment></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reese</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Blau</surname><given-names>H</given-names> </name><name name-style="western"><surname>Casiraghi</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Generalisable long COVID subtypes: findings from the NIH N3C and RECOVER programmes</article-title><source>eBioMedicine</source><year>2023</year><month>01</month><volume>87</volume><fpage>104413</fpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2022.104413</pub-id><pub-id pub-id-type="medline">36563487</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>W</given-names> </name><name name-style="western"><surname>He</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>Q</given-names> </name></person-group><article-title>Latent class analysis-derived classification improves the cancer-specific death stratification of molecular subtyping in colorectal cancer</article-title><source>NPJ Precis Oncol</source><year>2023</year><month>06</month><day>23</day><volume>7</volume><issue>1</issue><fpage>60</fpage><pub-id pub-id-type="doi">10.1038/s41698-023-00412-w</pub-id><pub-id pub-id-type="medline">37353681</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Faghri</surname><given-names>F</given-names> </name><name name-style="western"><surname>Brunn</surname><given-names>F</given-names> </name><name name-style="western"><surname>Dadu</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Identifying and predicting amyotrophic lateral sclerosis clinical subgroups: a population-based machine-learning study</article-title><source>Lancet Digit Health</source><year>2022</year><month>05</month><volume>4</volume><issue>5</issue><fpage>e359</fpage><lpage>e369</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(21)00274-0</pub-id><pub-id pub-id-type="medline">35341712</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Hesitancy to undergo SARS-CoV-2 rapid antigen testing in China: nationwide cross-sectional study</article-title><source>JMIR Public Health Surveill</source><year>2023</year><month>05</month><day>1</day><volume>9</volume><fpage>e43555</fpage><pub-id pub-id-type="doi">10.2196/43555</pub-id><pub-id pub-id-type="medline">36888911</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Al-Aly</surname><given-names>Z</given-names> </name></person-group><article-title>Long-term neurologic outcomes of COVID-19</article-title><source>Nat Med</source><year>2022</year><month>11</month><volume>28</volume><issue>11</issue><fpage>2406</fpage><lpage>2415</lpage><pub-id pub-id-type="doi">10.1038/s41591-022-02001-z</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="confproc"><person-group person-group-type="editor"><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>XGBoost: a scalable tree boosting system</article-title><year>2016</year><conf-name>KDD '16: The 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Erion</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name><etal/></person-group><article-title>From local explanations to global understanding with explainable AI for trees</article-title><source>Nat Mach Intell</source><year>2020</year><month>01</month><volume>2</volume><issue>1</issue><fpage>56</fpage><lpage>67</lpage><pub-id pub-id-type="doi">10.1038/s42256-019-0138-9</pub-id><pub-id pub-id-type="medline">32607472</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>W</given-names> </name><name name-style="western"><surname>Phung</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tran</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title><source>J Med Internet Res</source><year>2016</year><month>12</month><day>16</day><volume>18</volume><issue>12</issue><fpage>e323</fpage><pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id><pub-id pub-id-type="medline">27986644</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Reitsma</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name></person-group><article-title>Transparent reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis (TRIPOD): The TRIPOD statement</article-title><source>Ann Intern Med</source><year>2015</year><month>01</month><day>6</day><volume>162</volume><issue>1</issue><fpage>55</fpage><lpage>63</lpage><pub-id pub-id-type="doi">10.7326/M14-0697</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name></person-group><source>lulab.utils: Supporting Functions Maintained by Zhen Lu</source><year>2024</year><comment><ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=lulab.utils">https://CRAN.R-project.org/package=lulab.utils</ext-link></comment></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>Z</given-names> </name></person-group><source>SCREENing</source><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/Leslie-Lu/SCREENing">https://github.com/Leslie-Lu/SCREENing</ext-link></comment></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosty</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sheffer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tsafrir</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Identification of a proliferation gene cluster associated with HPV E6/E7 expression level and viral DNA load in invasive cervical carcinoma</article-title><source>Oncogene</source><year>2005</year><month>10</month><day>27</day><volume>24</volume><issue>47</issue><fpage>7094</fpage><lpage>7104</lpage><pub-id pub-id-type="doi">10.1038/sj.onc.1208854</pub-id><pub-id pub-id-type="medline">16007141</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Identification of HPV oncogene and host cell differentiation associated cellular heterogeneity in cervical cancer via single&#x2010;cell transcriptomic analysis</article-title><source>J Med Virol</source><year>2023</year><month>08</month><volume>95</volume><issue>8</issue><pub-id pub-id-type="doi">10.1002/jmv.29060</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sait</surname><given-names>K</given-names> </name><name name-style="western"><surname>Turki</surname><given-names>R</given-names> </name><name name-style="western"><surname>Abuzenadah</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Jiffiri</surname><given-names>OH</given-names> </name><name name-style="western"><surname>Bohmaidah</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sohrab</surname><given-names>SS</given-names> </name></person-group><article-title>Genetic diversity and phylogenetic analysis of HPV 16 &#x0026; 18 variants isolated from cervical specimens of women in Saudi Arabia</article-title><source>Saudi J Biol Sci</source><year>2019</year><month>02</month><volume>26</volume><issue>2</issue><fpage>317</fpage><lpage>324</lpage><pub-id pub-id-type="doi">10.1016/j.sjbs.2018.05.005</pub-id><pub-id pub-id-type="medline">31485171</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Balanda</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fern&#x00E1;ndez</surname><given-names>J</given-names> </name><name name-style="western"><surname>Vergara</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Genetic variability of human papillomavirus type 66 L1 gene among women presenting for cervical cancer screening in Chile</article-title><source>Med Microbiol Immunol</source><year>2019</year><month>12</month><volume>208</volume><issue>6</issue><fpage>757</fpage><lpage>771</lpage><pub-id pub-id-type="doi">10.1007/s00430-019-00621-w</pub-id><pub-id pub-id-type="medline">31165237</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wan</surname><given-names>F</given-names> </name><name name-style="western"><surname>Miao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Quraishi</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kennedy</surname><given-names>V</given-names> </name><name name-style="western"><surname>Creek</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Pirisi</surname><given-names>L</given-names> </name></person-group><article-title>Gene expression changes during HPV-mediated carcinogenesis: a comparison between an in vitro cell model and cervical cancer</article-title><source>Int J Cancer</source><year>2008</year><month>07</month><day>1</day><volume>123</volume><issue>1</issue><fpage>32</fpage><lpage>40</lpage><pub-id pub-id-type="doi">10.1002/ijc.23463</pub-id><pub-id pub-id-type="medline">18398830</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>V&#x00E1;zquez-Ort&#x00ED;z</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ciudad</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Pi&#x00F1;a</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Gene identification by cDNA arrays in HPV-positive cervical cancer</article-title><source>Arch Med Res</source><year>2005</year><volume>36</volume><issue>5</issue><fpage>448</fpage><lpage>458</lpage><pub-id pub-id-type="doi">10.1016/j.arcmed.2005.04.016</pub-id><pub-id pub-id-type="medline">16099320</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Widschwendter</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gattringer</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ivarsson</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Analysis of aberrant DNA methylation and human papillomavirus DNA in cervicovaginal specimens to detect invasive cervical cancer and its precursors</article-title><source>Clin Cancer Res</source><year>2004</year><month>05</month><day>15</day><volume>10</volume><issue>10</issue><fpage>3396</fpage><lpage>3400</lpage><pub-id pub-id-type="doi">10.1158/1078-0432.CCR-03-0143</pub-id><pub-id pub-id-type="medline">15161694</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shiri Aghbash</surname><given-names>P</given-names> </name><name name-style="western"><surname>Shirvaliloo</surname><given-names>M</given-names> </name><name name-style="western"><surname>Khalo Abass Kasho</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alinezhad</surname><given-names>F</given-names> </name><name name-style="western"><surname>Nauwynck</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bannazadeh Baghi</surname><given-names>H</given-names> </name></person-group><article-title>Cluster of differentiation frequency on antigen presenting-cells: the next step to cervical cancer prognosis?</article-title><source>Int Immunopharmacol</source><year>2022</year><month>07</month><volume>108</volume><fpage>108896</fpage><pub-id pub-id-type="doi">10.1016/j.intimp.2022.108896</pub-id><pub-id pub-id-type="medline">35640377</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Man</surname><given-names>I</given-names> </name><name name-style="western"><surname>Georges</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bonjour</surname><given-names>M</given-names> </name><name name-style="western"><surname>Baussano</surname><given-names>I</given-names> </name></person-group><article-title>Approximating missing epidemiological data for cervical cancer through footprinting: a case study in India</article-title><source>Elife</source><year>2023</year><month>05</month><day>25</day><volume>12</volume><fpage>e81752</fpage><pub-id pub-id-type="doi">10.7554/eLife.81752</pub-id><pub-id pub-id-type="medline">37227260</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>S</given-names> </name><etal/></person-group><article-title>HPV-related methylation-based reclassification and risk stratification of cervical cancer</article-title><source>Mol Oncol</source><year>2020</year><month>09</month><volume>14</volume><issue>9</issue><fpage>2124</fpage><lpage>2141</lpage><pub-id pub-id-type="doi">10.1002/1878-0261.12709</pub-id><pub-id pub-id-type="medline">32408396</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sui</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Guidelines for cervical cancer screening in China</article-title><source>Gynecol Obstet Clin Med</source><year>2023</year><month>12</month><volume>3</volume><issue>4</issue><fpage>189</fpage><lpage>194</lpage><pub-id pub-id-type="doi">10.1016/j.gocm.2023.10.005</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sawaya</surname><given-names>GF</given-names> </name><name name-style="western"><surname>Smith-McCune</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kuppermann</surname><given-names>M</given-names> </name></person-group><article-title>Cervical cancer screening: more choices in 2019</article-title><source>J Am Med Assoc</source><year>2019</year><month>05</month><day>28</day><volume>321</volume><issue>20</issue><fpage>2018</fpage><lpage>2019</lpage><pub-id pub-id-type="doi">10.1001/jama.2019.4595</pub-id><pub-id pub-id-type="medline">31135834</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Arc&#x00E0;</surname><given-names>E</given-names> </name><name name-style="western"><surname>Sinha</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hartl</surname><given-names>K</given-names> </name><name name-style="western"><surname>Houwing</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kothari</surname><given-names>S</given-names> </name></person-group><article-title>Cervical cancer screening guidelines and screening practices in 11 countries: a systematic literature review</article-title><source>Prev Med Rep</source><year>2022</year><month>08</month><volume>28</volume><fpage>101813</fpage><pub-id pub-id-type="doi">10.1016/j.pmedr.2022.101813</pub-id><pub-id pub-id-type="medline">35637896</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hickey</surname><given-names>M</given-names> </name><name name-style="western"><surname>Basu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sassarini</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Managing menopause after cancer</article-title><source>The Lancet</source><year>2024</year><month>03</month><volume>403</volume><issue>10430</issue><fpage>984</fpage><lpage>996</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(23)02802-7</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gierisch</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Coeytaux</surname><given-names>RR</given-names> </name><name name-style="western"><surname>Urrutia</surname><given-names>RP</given-names> </name><etal/></person-group><article-title>Oral contraceptive use and risk of breast, cervical, colorectal, and endometrial cancers: a systematic review</article-title><source>Cancer Epidemiol Biomarkers Prev</source><year>2013</year><month>11</month><day>1</day><volume>22</volume><issue>11</issue><fpage>1931</fpage><lpage>1943</lpage><pub-id pub-id-type="doi">10.1158/1055-9965.EPI-13-0298</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Data Supplement.</p><media xlink:href="publichealth_v11i1e67840_app1.docx" xlink:title="DOCX File, 380 KB"/></supplementary-material></app-group></back></article>