<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e41162</article-id>
      <article-id pub-id-type="pmid">36696166</article-id>
      <article-id pub-id-type="doi">10.2196/41162</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Predicting Risky Sexual Behavior Among College Students Through Machine Learning Approaches: Cross-sectional Analysis of Individual Data From 1264 Universities in 31 Provinces in China</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Eleftheriou</surname>
            <given-names>Anastasia</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chiou</surname>
            <given-names>Piao-Yi</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Xuan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7366-7517</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Hanxiyue</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4333-9293</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Shuangyu</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0454-872X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Tang</surname>
            <given-names>Kun</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Vanke School of Public Health</institution>
            <institution>Tsinghua University</institution>
            <addr-line>No 30 Shuangqing Road</addr-line>
            <addr-line>Haidian District</addr-line>
            <addr-line>Beijing, 100084</addr-line>
            <country>China</country>
            <phone>86 13671129425</phone>
            <email>tangk@mail.tsinghua.edu.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5444-186X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Vanke School of Public Health</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Kun Tang <email>tangk@mail.tsinghua.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>25</day>
        <month>1</month>
        <year>2023</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e41162</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>30</day>
          <month>11</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Xuan Li, Hanxiyue Zhang, Shuangyu Zhao, Kun Tang. Originally published in JMIR Public Health and Surveillance (https://publichealth.jmir.org), 25.01.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on https://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://publichealth.jmir.org/2023/1/e41162" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Risky sexual behavior (RSB), the most direct risk factor for sexually transmitted infections (STIs), is common among college students. Thus, identifying relevant risk factors and predicting RSB are important to intervene and prevent RSB among college students.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aim to establish a predictive model for RSB among college students to facilitate timely intervention and the prevention of RSB to help limit STI contraction.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We included a total of 8794 heterosexual Chinese students who self-reported engaging in sexual intercourse from November 2019 to February 2020. We identified RSB among those students and attributed it to 4 dimensions: whether contraception was used, whether the contraceptive method was safe, whether students engaged in casual sex or sex with multiple partners, and integrated RSB (which combined the first 3 dimensions). Overall, 126 predictors were included in this study, including demographic characteristics, daily habits, physical and mental health, relationship status, sexual knowledge, sexual education, sexual attitude, and previous sexual experience. For each type of RSB, we compared 8 machine learning (ML) models: multiple logistic regression (MLR), naive Bayes (BYS), linear discriminant analysis (LDA), random forest (RF), gradient boosting machine (GBM), extreme gradient boosting (XGBoost), deep learning (DL), and the ensemble model. The optimal model for both RSB prediction and risk factor identification was selected based on a set of validation indicators. An MLR model was applied to investigate the association between RSB and identified risk factors through ML methods.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In total, 5328 (60.59%) students were found to have previously engaged in RSB. Among them, 3682 (41.87%) did not use contraception every time they had sexual intercourse, 3602 (40.96%) had previously used an ineffective or unsafe contraceptive method, and 1157 (13.16%) had engaged in casual sex or sex with multiple partners. XGBoost achieved the optimal predictive performance on all 4 types of RSB, with the area under the receiver operator characteristic curve (AUROC) reaching 0.78, 0.72, 0.94, and 0.80 for contraceptive use, safe contraceptive method use, engagement in casual sex or sex with multiple partners, and integrated RSB, respectively. By ensuring the stability of various validation indicators, the 12 most predictive variables were then selected using XGBoost, including the participants’ relationship status, sexual knowledge, sexual attitude, and previous sexual experience. Through MLR, RSB was found to be significantly associated with less sexual knowledge, more liberal sexual attitudes, single relationship status, and increased sexual experience.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>RSB is prevalent among college students. The XGBoost model is an effective approach to predict RSB and identify corresponding risk factors. This study presented an opportunity to promote sexual and reproductive health through ML models, which can help targeted interventions aimed at different subgroups and the precise surveillance and prevention of RSB among college students through risk probability prediction.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>risky sexual behavior</kwd>
        <kwd>sexually transmitted infections</kwd>
        <kwd>college students</kwd>
        <kwd>machine learning</kwd>
        <kwd>prediction</kwd>
        <kwd>students</kwd>
        <kwd>risk factor</kwd>
        <kwd>STI</kwd>
        <kwd>intervention</kwd>
        <kwd>China</kwd>
        <kwd>sex</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Risky sexual behavior (RSB) is defined as sexual activities that are more likely to lead to the risk of sexually transmitted infections (STIs) and unwanted pregnancies [<xref ref-type="bibr" rid="ref1">1</xref>], including sex without contraceptive use and sex with an ineffective or unsafe contraceptive method. It is a serious issue among college students worldwide, especially in low- and middle-income countries [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Among 5 types of contraceptive methods under the classification criterion from the World Health Organization (WHO) [<xref ref-type="bibr" rid="ref4">4</xref>], condoms and hormonal contraceptive methods are regarded as safe and highly effective for adolescents [<xref ref-type="bibr" rid="ref5">5</xref>]. Studies have shown that consistent condom use is low among college students [<xref ref-type="bibr" rid="ref6">6</xref>]. In previous research, it was estimated that approximately 40% of students did not use a condom during their last sexual encounter [<xref ref-type="bibr" rid="ref7">7</xref>]. Casual sex and sex with multiple partners have also been regarded as RSBs [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Nearly half of the college students had casual sex experience [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], and approximately 50.7% of students were sexually active, with 42.3% of students having multiple sexual partners [<xref ref-type="bibr" rid="ref13">13</xref>]. Thus, to help reduce the influence of RSB, it is important to intervene and prevent it among college students by identifying relevant risk factors and making RSB predictions.</p>
      <p>A number of association studies have focused on the risk factors for RSB. A systematic review of 30 papers summarized 11 aspects of risk factors of RSB including sociodemographics, gender roles, substance use, and partner characteristics [<xref ref-type="bibr" rid="ref14">14</xref>]. It was widely validated that being male [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], drinking alcohol [<xref ref-type="bibr" rid="ref17">17</xref>], experiencing poverty, and experiencing peer pressure [<xref ref-type="bibr" rid="ref18">18</xref>] are significant risk factors for RSB [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Mental health has also been linked to RSB, with higher depression resulting in more RSB and STIs [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. In addition, numerous public health and sociological studies have found that romantic relationship status [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], sexual knowledge [<xref ref-type="bibr" rid="ref1">1</xref>], and sexual attitude have a significant influence on RSB [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. However, few studies have fully used these identified factors to make RSB predictions.</p>
      <p>Previous predictive studies on RSB have mostly been based on conventional regression models, which have high limitations of assumption and less ideal effects on RSB prediction. To fill such gaps, machine learning (ML) offers a possible alternative for factor identification and outcome prediction. In the past few years, a large number of studies have emerged using ML to predict the occurrence of STIs, which have achieved ideal performance [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. However, RSB, as the main transmission route for STIs, has gained little attention from ML for prediction.</p>
      <p>The objective of this study was to develop an ML-based model to precisely predict RSB in college students. Through a cross-province survey in China, this study aimed to develop a series of ML models to predict different types of RSB among Chinese college students. By comparison, we adopted the optimal model to identify key risk factors to help recognize and predict college students’ engagement in RSB, thus facilitating more precise intervention and prevention.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Participants and Research Procedures</title>
        <p>We conducted a large-scale and internet-based survey, the National College Student Survey on Sexual and Reproductive Health in 2020 (NCSS-SRH 2020), sponsored by the China Family Planning Association (CFPA). Through multistage sampling from November 2019 to February 2020, a total of 55,757 Chinese college students from 1264 universities completed the questionnaire survey. Voluntary participants were recruited using snowball sampling, and informed consent was obtained from each participant before completing the survey.</p>
        <p>Among all participants, 1177 (2.11%) were excluded for either failing the attention check questions, ignoring the informed consent, or being outside the age range for college students (15-24 years old according to a standard definition of late adolescence and young adulthood by WHO) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Samples with duplicated answers and variables with missing values over 5% were deleted. For the remaining variables, missing values were imputed with the use of multiple imputation. Due to the constraint of sexual orientation and past sexual experience, 8794 (15.78%) self-identified heterosexual students with sexual intercourse experience were finally included in the analyses.</p>
      </sec>
      <sec>
        <title>RSB Outcomes</title>
        <p>We classified RSB from 4 perspectives: (1) whether contraception was used, (2) whether the contraceptive method was effective and safe, (3) whether participants engaged in casual sex or sex with multiple partners, and (4) the integration of the former 3 perspectives.</p>
        <p>Contraception use was evaluated through 2 dimensions. Regarding frequency, contraception use was measured by the question “Do you use contraception while having sex every time you have sexual intercourse?” Regarding practices, contraception use was measured by the question “Did you/your partner use contraception the last time you had sex?” For both questions, a “no” response was considered to indicate RSB. According to WHO guidance, 4 contraceptive types with over 10 specific methods were investigated as contraception use: hormonal contraceptive methods, intrauterine devices, emergency contraception, and condoms [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>The effectiveness and safety of contraception were mainly determined by the method of contraception. If someone reported using “emergency contraception,” “external ejaculation,” or a “safe period” for contraception, they were considered a member of the RSB group. The effectiveness and safety of contraception were also evaluated through the frequency and practice dimensions, which were, respectively, measured by the question of whether such approaches were taken every time or the last time of sexual intercourse.</p>
        <p>Casual sex or sex with multiple partners was assessed with the following question: “Have you ever had sex through ‘booty calls’, ‘one-night stands’, ‘buying sex’, or ‘sex with multiple partners’?” For this question, a “yes” response was considered to indicate RSB.</p>
        <p>Finally, the integrated RSB dimension was the combination of contraception use, the safety of contraception, and casual sex or sex with multiple partners. As long as 1 of these 3 types of behaviors occurred, we considered the student to have met the criteria for integrated RSB.</p>
      </sec>
      <sec>
        <title>Predictors</title>
        <p>We included 126 potential predictors, including baseline characteristics (sex, age, ethnicity, religion, income, parental information, etc), daily habits (exercise, appearance and popularity, mobile phone addiction, alcohol and tobacco consumption, etc), physical and mental health status, relationship status, sexual knowledge, sexual education, sexual attitude, previous sexual experience, experience of sexual harassment and assault, etc. Among them, the age of the participant, the age of the participant’s partner, the income and expenditure of the participant, and the frequency of sports were treated as continuous variables. Other variables, including the degree of agreement, the frequency of participation, and the order of evaluation, were treated as either binary variables or ordered categorical variables.</p>
        <p>Continuous variables were standardized, and categorical variables were split into multidimensional Boolean values before applying ML models. For each type of RSB, we used ML models to select and identify key variables to predict RSB among college students.</p>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>For descriptive statistics of baseline characteristics, continuous data were presented as the mean (SD) or the median (IQR), and the Student <italic>t</italic>-test or the Kruskal-Wallis test was applied depending on the normality of the distribution. Categorical data were presented in the form of counts with percentages, and the chi-square test or the Fisher exact test was applied. <italic>P</italic>&#60;.05 in a 2-tailed test was considered statistically significant in these tests. In addition, we developed multivariable mixed models with a logit link function to learn the specific linear relationship between RSB and the key variables screened by ML. The results were presented in the form of point estimates of coefficients and corresponding 95% CIs, and statistical significance was accepted when <italic>P</italic>&#60;.05.</p>
      </sec>
      <sec>
        <title>Model Development and Validation</title>
        <p>We used 8 ML approaches: multiple logistic regression (MLR), naive Bayes (BYS), linear discriminant analysis (LDA), random forest (RF), gradient boosting machine (GBM), extreme gradient boosting (XGBoost), deep learning (DL), and the ensemble model. The ensemble model used the average values of all other models’ predictive values to perform classification. The data set was split into a training set and a test set randomly in a ratio of 8:2, with 7035 (80%) samples in the training set and 1759 (20%) samples in the test set. Our models were built on the training set and then applied to the test set for RSB prediction. Model discrimination was assessed through the receiver operator characteristic (ROC) curve, and model performance was assessed through accuracy, precision, recall, <italic>F</italic><sub>1</sub>-score, the area under the receiver operator characteristic curve (AUROC), and the root-mean-square error (RMSE) calculated on the test set, which were presented in the form of the mean (SD).</p>
        <p>Through comparison, we chose the optimal model for RSB prediction and included the most predictive variables in the model. The appropriate number of predictive variables was determined by the turning points of the model performance indicators. If none of the indicators changed significantly through statistical testing when a new variable was added, we considered the turning point to have been reached.</p>
        <p>To obtain the optimal performance for each model, we adopted the minimum distance (MD) method to select cut-off points to discriminate predictive values into 0 or 1. The MD method regarded the point closest to (0,1) on the ROC curve as the optimal cut-off point. To ensure the reliability and minimize the sensitivity of the results, we used a 10-fold cross-validation method to select the tuning hyperparameters as well as cut-off points. In addition, we repeated this process 10 times to minimize the influence of accidental circumstances.</p>
        <p>All models were generated using R version 4.0.3 (R Core Team and the R Foundation for Statistical Computing). We used the <italic>glmnet</italic> package for MLR, the <italic>e1071</italic> package for BYS, the <italic>MASS</italic> package for LDA, the <italic>randomForest</italic> package for the RF, the <italic>gbm</italic> package for GBM, the <italic>xgboost</italic> package for XGBoost, and the <italic>h2o</italic> package for DL.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Ethical approval was obtained from the Institutional Review Board of Tsinghua University (IRB no. 20190083). All participants provided informed consent online, which was set before answering the questionnaire and emphasized the autonomy of participating and the ability to withdraw at any time. The privacy of personal information was protected throughout the study via anonymous data collection, and confidentiality was maintained by asking participants to provide honest answers. Eligible participation in this survey was voluntary and was not compensated.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Baseline Characteristics</title>
        <p>The baseline characteristics of the participants are shown in <xref ref-type="table" rid="table1">Table 1</xref>. Our sample covered all provincial-level administrative regions in China and achieved a relatively good balance in the sample division of eastern, central, western, and northeastern regions (n=4758, 54.11%, n=1484, 16.88%, n=2140, 24.33%, and n=412, 4.69%, respectively), as well as the sex ratio (males: n=3918, 44.55%; females: n=4876, 55.45%). A total of 8794 students were included, among which 3682 (41.87%) did not use contraception every time they engaged in sexual intercourse, 3602 (40.96%) did not use safe or effective contraceptive methods every time they engaged in sexual intercourse, 1157 (13.16%) had casual sex or sex with multiple partners, and 5328 (60.59%) had experience with at least 1 of those 3 former behaviors before. In addition, 307 (3.49%) participants did not use contraception and 2140 (24.33%) used ineffective or unsafe contraceptive methods during their last sexual intercourse, the details of which are shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The distribution of basic characteristics differed greatly in terms of RSB. Between the 2 groups with and without integrated RSB, the region of residence, sex, age, ethnicity, religious beliefs, urbanization of hometown, left-behind experience, migration experience, and self-assessment of family finances were significantly different (<italic>P</italic>&#60;.05) among college students.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Baseline characteristics of participants (N=8794) grouped by different types of RSB<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="220"/>
            <col width="120"/>
            <col width="150"/>
            <col width="160"/>
            <col width="160"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics</td>
                <td>Overall</td>
                <td>RSB type 1 (nonuse of contraception)<sup>b</sup></td>
                <td>RSB type 2 (ineffective or unsafe contraceptive method)<sup>c</sup></td>
                <td>RSB type 3 (casual sex or sex with multiple partners)<sup>d</sup></td>
                <td>RSB type 4 (integrated RSB)<sup>e</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  <bold>Region of residence, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>&#60;.001, <italic>P</italic><sub>3</sub>=.007, <italic>P</italic><sub>4</sub>&#60;.001<sup>f</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Eastern</td>
                <td>4758 (54.11)</td>
                <td>1770 (48.07)</td>
                <td>1779 (49.39)</td>
                <td>676 (58.43)</td>
                <td>2697 (50.62)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Central</td>
                <td>1484 (16.88)</td>
                <td>660 (17.93)</td>
                <td>627 (17.41)</td>
                <td>163 (14.09)</td>
                <td>910 (17.08)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Western</td>
                <td>2140 (24.33)</td>
                <td>1094 (29.71)</td>
                <td>1026 (28.48)</td>
                <td>263 (22.73)</td>
                <td>1476 (27.70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Northeastern</td>
                <td>412 (4.69)</td>
                <td>158 (4.29)</td>
                <td>170 (4.72)</td>
                <td>55 (4.75)</td>
                <td>245 (4.60)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Sex, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>=.15, <italic>P</italic><sub>3</sub>&#60;.001, <italic>P</italic><sub>4</sub>&#60;.001</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>3918 (44.55)</td>
                <td>1826 (49.59)</td>
                <td>1638 (45.47)</td>
                <td>646 (55.83)</td>
                <td>2573 (48.29)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>4876 (55.45)</td>
                <td>1856 (50.41)</td>
                <td>1964 (54.53)</td>
                <td>511 (44.17)</td>
                <td>2755 (51.71)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Self-assessed gender-role conformity<sup>g</sup>, n (%); <italic>P</italic><sub>1</sub>=.29, <italic>P</italic><sub>2</sub>=.70, <italic>P</italic><sub>3</sub>&#60;.001, <italic>P</italic><sub>4</sub>=.52</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Low</td>
                <td>277 (3.15)</td>
                <td>104 (2.82)</td>
                <td>109 (3.03)</td>
                <td>60 (5.19)</td>
                <td>177 (3.32)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Middle</td>
                <td>4158 (47.28)</td>
                <td>1759 (47.77)</td>
                <td>1720 (47.75)</td>
                <td>500 (43.22)</td>
                <td>2515 (47.20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td>4359 (49.57)</td>
                <td>1819 (49.40)</td>
                <td>1773 (49.22)</td>
                <td>597 (51.60)</td>
                <td>2636 (49.47)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), median (IQR); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>&#60;.001, <italic>P</italic><sub>3</sub>&#60;.001, <italic>P</italic><sub>4</sub>&#60;.001</td>
                <td>20.00 (19.00-21.00)</td>
                <td>20.00 (19.00-21.00)</td>
                <td>20.00 (19.00-21.00)</td>
                <td>20.00 (19.00-22.00)</td>
                <td>20.00 (19.00-21.00)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Ethnicity, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>&#60;.001, <italic>P</italic><sub>3</sub>=.77, <italic>P</italic><sub>4</sub>&#60;.001</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Han</td>
                <td>7902 (89.86)</td>
                <td>3240 (88.00)</td>
                <td>3164 (87.84)</td>
                <td>1043 (90.15)</td>
                <td>4698 (88.18)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Minority</td>
                <td>892 (10.14)</td>
                <td>442 (12.00)</td>
                <td>438 (12.16)</td>
                <td>114 (9.85)</td>
                <td>630 (11.82)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Religious beliefs, n (%); <italic>P</italic><sub>1</sub>=.005, <italic>P</italic><sub>2</sub>=.051, <italic>P</italic><sub>3</sub>=.17, <italic>P</italic><sub>4</sub>=.006</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>8039 (91.41)</td>
                <td>3329 (90.41)</td>
                <td>3267 (90.70)</td>
                <td>1045 (90.32)</td>
                <td>4835 (90.75)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>755 (8.59)</td>
                <td>353 (9.59)</td>
                <td>335 (9.30)</td>
                <td>112 (9.68)</td>
                <td>493 (9.25)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average monthly expenditure (CNY)/US $<sup>h</sup>, median (IQR); <italic>P</italic><sub>1</sub>=.29, <italic>P</italic><sub>2</sub>=.64, <italic>P</italic><sub>3</sub>&#60;.001, <italic>P</italic><sub>4</sub>=.47</td>
                <td>1800.00 (1200.00-2500.00)/265.48 (176.99-368.73)</td>
                <td>1800.00 (1200.00-2500.00)/265.48 (176.99-368.73)</td>
                <td>1800.00 (1200.00-2500.00)/265.48 (176.99-368.73)</td>
                <td>2000.00 (1500.00-3000.00)/294.98 (221.24-442.47)</td>
                <td>1800.00 (1200.00-2500.00)/265.48 (176.99-368.73)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Urbanization of hometown, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>=.16, <italic>P</italic><sub>3</sub>&#60;.001, <italic>P</italic><sub>4</sub>=.001</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urban</td>
                <td>4827 (54.89)</td>
                <td>1893 (51.41)</td>
                <td>1940 (53.86)</td>
                <td>745 (64.39)</td>
                <td>2846 (53.42)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Suburban</td>
                <td>2669 (30.35)</td>
                <td>1166 (31.67)</td>
                <td>1103 (30.62)</td>
                <td>281 (24.29)</td>
                <td>1644 (30.86)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rural</td>
                <td>1298 (14.76)</td>
                <td>623 (16.92)</td>
                <td>559 (15.52)</td>
                <td>131 (11.32)</td>
                <td>838 (15.73)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Left-behind experience, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>&#60;.001, <italic>P</italic><sub>3</sub>=.006, <italic>P</italic><sub>4</sub>&#60;.001</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>6184 (70.32)</td>
                <td>2426 (65.89)</td>
                <td>2450 (68.02)</td>
                <td>854 (73.81)</td>
                <td>3631 (68.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>2610 (29.68)</td>
                <td>1256 (34.11)</td>
                <td>1152 (31.98)</td>
                <td>303 (26.19)</td>
                <td>1697 (31.85)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Migration experience, n (%); <italic>P</italic><sub>1</sub>=.04, <italic>P</italic><sub>2</sub>&#60;.001, <italic>P</italic><sub>3</sub>=.14, <italic>P</italic><sub>4</sub>=.003</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>6864 (78.05)</td>
                <td>2830 (76.86)</td>
                <td>2738 (76.01)</td>
                <td>923 (79.78)</td>
                <td>4101 (76.97)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>1930 (21.95)</td>
                <td>852 (23.14)</td>
                <td>864 (23.99)</td>
                <td>234 (20.22)</td>
                <td>1227 (23.03)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Self-assessment of family finances<sup>i</sup>, n (%); <italic>P</italic><sub>1</sub>&#60;.001, <italic>P</italic><sub>2</sub>=.08, <italic>P</italic><sub>3</sub>=.14, <italic>P</italic><sub>4</sub>=.005</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Low</td>
                <td>652 (7.41)</td>
                <td>316 (8.58)</td>
                <td>293 (8.13)</td>
                <td>89 (7.69)</td>
                <td>434 (8.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Middle</td>
                <td>7167 (81.50)</td>
                <td>2985 (81.07)</td>
                <td>2904 (80.62)</td>
                <td>921 (79.60)</td>
                <td>4303 (80.76)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td>975 (11.09)</td>
                <td>381 (10.35)</td>
                <td>405 (11.24)</td>
                <td>147 (12.71)</td>
                <td>591 (11.09)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>RSB: risky sexual behavior.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Nonuse of contraception indicated that someone did not use contraception every time they had sex.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Ineffective or unsafe contraception indicated that someone often used unsafe contraceptive methods (eg, emergency contraception, external ejaculation, and safe period).</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>Casual sex or sex with multiple partners indicated that someone had engaged in casual sex or sex with multiple partners before.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Integrated RSB was the combination of the former 3 types of RSB.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup><italic>P</italic><sub>1</sub>, <italic>P</italic> value of RSB type 1; <italic>P</italic><sub>2</sub>, <italic>P</italic> value of RSB type 2; <italic>P</italic><sub>3</sub>, <italic>P</italic> value of RSB type 3; <italic>P</italic><sub>4</sub>, <italic>P</italic> value of RSB type 4.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>Self-assessed gender role conformity is a 1-7–ordered categorical-scale question. We classified the responses into 3 groups: low conformity (1-2), middle conformity (3-5), and high conformity (6-7).</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>CNY 1=US $0.14749.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>Self-assessment of family finances is a 1-7–ordered categorical-scale question. We classified the responses into 3 groups: low income (1-2), middle income (3-5), and high income (6-7).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Performance and Validation</title>
        <p>To precisely identify RSB among Chinese college students, we used various ML models to execute RSB prediction on the test data set to choose the optimal model. The model performance for the 4 types of RSB is presented in <xref ref-type="table" rid="table2">Table 2</xref>, and the model performance for the other 2 types of RSB based on the last sexual intercourse is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Through the comparison from multiple rounds of experiments, it was obvious that some ML models had better efficiency than the traditional multiple logistic regression model. Compared to the performance of MLR (for which the average AUROCs were 0.76, 0.71, 0.91, and 0.79, respectively), XGBoost, GBM, and the RF presented better performance in terms of accuracy, the <italic>F</italic><sub>1</sub>-score, and the AUROC.</p>
        <p>To better understand model discrimination, we plotted ROC curves of all models on 4 types of RSB in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Similarly, ROC curves of the other 2 types of RSB based on the last time of sexual intercourse are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. It could be inferred that the curves of XGBoost and GBM were above the other curves, which suggests that these 2 models outperformed the others. Their average results were similar (average AUROCs were 0.77, 0.72, 0.94, and 0.80, respectively, in GBM and 0.78, 0.72, 0.94, and 0.80, respectively, in XGBoost). The ensemble model also played an effective role in predicting different types of RSB (average AUROCs were 0.77, 0.72, 0.93, and 0.79, respectively).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Model performance among different types of RSB<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="60"/>
            <col width="140"/>
            <col width="130"/>
            <col width="130"/>
            <col width="130"/>
            <col width="130"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>RSB</td>
                <td>Model</td>
                <td>Accuracy, mean (SD)</td>
                <td>Precision, mean (SD)</td>
                <td>Recall, mean (SD)</td>
                <td>F<sub>1</sub>-score, mean (SD)</td>
                <td>AUROC<sup>b</sup>, mean (SD)</td>
                <td>RMSE<sup>c</sup>, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Nonuse of contraception<sup>d</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="8">
                  <break/>
                </td>
                <td>MLR<sup>e</sup></td>
                <td>0.70 (0.01)</td>
                <td>0.63 (0.02)</td>
                <td>0.70 (0.02)</td>
                <td>0.66 (0.01)</td>
                <td>0.76 (0.01)</td>
                <td>0.44 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>BYS<sup>f</sup></td>
                <td>0.66 (0.01)</td>
                <td>0.58 (0.02)</td>
                <td>0.68 (0.02)</td>
                <td>0.62 (0.01)</td>
                <td>0.71 (0.01)</td>
                <td>0.53 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>LDA<sup>g</sup></td>
                <td>0.70 (0.01)</td>
                <td>0.63 (0.02)</td>
                <td>0.71 (0.02)</td>
                <td>0.66 (0.01)</td>
                <td>0.76 (0.01)</td>
                <td>0.44 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>RF<sup>h</sup></td>
                <td>0.71 (0.01)</td>
                <td>0.63 (0.02)</td>
                <td>0.72 (0.02)</td>
                <td>0.67 (0.01)</td>
                <td>0.77 (0.01)</td>
                <td>0.44 (0.00)</td>
              </tr>
              <tr valign="top">
                <td>GBM<sup>i</sup></td>
                <td>0.71 (0.01)</td>
                <td>0.64 (0.02)</td>
                <td>0.72 (0.02)</td>
                <td>0.67 (0.01)</td>
                <td>0.77 (0.01)</td>
                <td>1.07 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>XGBoost<sup>j</sup></td>
                <td>0.71 (0.01)</td>
                <td>0.63 (0.02)</td>
                <td>0.72 (0.03)</td>
                <td>0.67 (0.01)</td>
                <td>0.78 (0.01)</td>
                <td>0.44 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>DL<sup>k</sup></td>
                <td>0.65 (0.01)</td>
                <td>0.58 (0.02)</td>
                <td>0.65 (0.03)</td>
                <td>0.61 (0.01)</td>
                <td>0.70 (0.01)</td>
                <td>0.52 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>Ensemble</td>
                <td>0.71 (0.01)</td>
                <td>0.63 (0.02)</td>
                <td>0.73 (0.02)</td>
                <td>0.67 (0.01)</td>
                <td>0.77 (0.01)</td>
                <td>0.44 (0.01)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Ineffective or unsafe contraceptive method<sup>l</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="8">
                  <break/>
                </td>
                <td>MLR</td>
                <td>0.66 (0.01)</td>
                <td>0.57 (0.02)</td>
                <td>0.67 (0.02)</td>
                <td>0.62 (0.01)</td>
                <td>0.71 (0.01)</td>
                <td>0.46 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>BYS</td>
                <td>0.63 (0.01)</td>
                <td>0.54 (0.02)</td>
                <td>0.65 (0.04)</td>
                <td>0.59 (0.02)</td>
                <td>0.68 (0.01)</td>
                <td>0.53 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>LDA</td>
                <td>0.66 (0.01)</td>
                <td>0.58 (0.02)</td>
                <td>0.66 (0.03)</td>
                <td>0.62 (0.01)</td>
                <td>0.71 (0.01)</td>
                <td>0.46 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>RF</td>
                <td>0.67 (0.01)</td>
                <td>0.58 (0.02)</td>
                <td>0.67 (0.03)</td>
                <td>0.62 (0.01)</td>
                <td>0.72 (0.01)</td>
                <td>0.46 (0.00)</td>
              </tr>
              <tr valign="top">
                <td>GBM</td>
                <td>0.67 (0.01)</td>
                <td>0.59 (0.02)</td>
                <td>0.66 (0.03)</td>
                <td>0.62 (0.01)</td>
                <td>0.72 (0.01)</td>
                <td>1.08 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.67 (0.01)</td>
                <td>0.59 (0.02)</td>
                <td>0.67 (0.03)</td>
                <td>0.62 (0.01)</td>
                <td>0.72 (0.01)</td>
                <td>0.46 (0.00)</td>
              </tr>
              <tr valign="top">
                <td>DL</td>
                <td>0.61 (0.01)</td>
                <td>0.52 (0.02)</td>
                <td>0.60 (0.04)</td>
                <td>0.56 (0.02)</td>
                <td>0.65 (0.02)</td>
                <td>0.54 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>Ensemble</td>
                <td>0.67 (0.01)</td>
                <td>0.58 (0.02)</td>
                <td>0.67 (0.02)</td>
                <td>0.62 (0.01)</td>
                <td>0.72 (0.01)</td>
                <td>0.46 (0.01)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Casual sex or sex with multiple partners<sup>m</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="8">
                  <break/>
                </td>
                <td>MLR</td>
                <td>0.83 (0.02)</td>
                <td>0.44 (0.03)</td>
                <td>0.84 (0.02)</td>
                <td>0.57 (0.03)</td>
                <td>0.91 (0.01)</td>
                <td>0.26 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>BYS</td>
                <td>0.79 (0.02)</td>
                <td>0.37 (0.03)</td>
                <td>0.77 (0.03)</td>
                <td>0.50 (0.02)</td>
                <td>0.85 (0.01)</td>
                <td>0.36 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>LDA</td>
                <td>0.83 (0.01)</td>
                <td>0.43 (0.03)</td>
                <td>0.85 (0.02)</td>
                <td>0.57 (0.02)</td>
                <td>0.90 (0.01)</td>
                <td>0.27 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>RF</td>
                <td>0.87 (0.01)</td>
                <td>0.50 (0.03)</td>
                <td>0.87 (0.02)</td>
                <td>0.64 (0.03)</td>
                <td>0.94 (0.01)</td>
                <td>0.24 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>GBM</td>
                <td>0.87 (0.01)</td>
                <td>0.52 (0.03)</td>
                <td>0.88 (0.02)</td>
                <td>0.65 (0.02)</td>
                <td>0.94 (0.01)</td>
                <td>1.03 (0.00)</td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.88 (0.01)</td>
                <td>0.53 (0.03)</td>
                <td>0.88 (0.02)</td>
                <td>0.66 (0.02)</td>
                <td>0.94 (0.01)</td>
                <td>0.23 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>DL</td>
                <td>0.83 (0.02)</td>
                <td>0.43 (0.03)</td>
                <td>0.83 (0.02)</td>
                <td>0.57 (0.03)</td>
                <td>0.90 (0.01)</td>
                <td>0.29 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>Ensemble</td>
                <td>0.86 (0.02)</td>
                <td>0.48 (0.03)</td>
                <td>0.86 (0.02)</td>
                <td>0.62 (0.03)</td>
                <td>0.93 (0.01)</td>
                <td>0.24 (0.01)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Integrated RSB<sup>n</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="8">
                  <break/>
                </td>
                <td>MLR</td>
                <td>0.72 (0.01)</td>
                <td>0.80 (0.01)</td>
                <td>0.71 (0.02)</td>
                <td>0.75 (0.01)</td>
                <td>0.79 (0.01)</td>
                <td>0.43 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>BYS</td>
                <td>0.68 (0.01)</td>
                <td>0.76 (0.01)</td>
                <td>0.68 (0.03)</td>
                <td>0.72 (0.02)</td>
                <td>0.74 (0.01)</td>
                <td>0.56 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>LDA</td>
                <td>0.71 (0.01)</td>
                <td>0.79 (0.01)</td>
                <td>0.70 (0.02)</td>
                <td>0.74 (0.01)</td>
                <td>0.77 (0.01)</td>
                <td>0.44 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>RF</td>
                <td>0.73 (0.01)</td>
                <td>0.80 (0.01)</td>
                <td>0.73 (0.02)</td>
                <td>0.77 (0.01)</td>
                <td>0.79 (0.01)</td>
                <td>0.43 (0.00)</td>
              </tr>
              <tr valign="top">
                <td>GBM</td>
                <td>0.73 (0.01)</td>
                <td>0.81 (0.01)</td>
                <td>0.73 (0.02)</td>
                <td>0.77 (0.01)</td>
                <td>0.80 (0.01)</td>
                <td>1.05 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>XGBoost</td>
                <td>0.73 (0.01)</td>
                <td>0.81 (0.01)</td>
                <td>0.73 (0.02)</td>
                <td>0.77 (0.01)</td>
                <td>0.80 (0.01)</td>
                <td>0.43 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>DL</td>
                <td>0.67 (0.01)</td>
                <td>0.77 (0.01)</td>
                <td>0.66 (0.02)</td>
                <td>0.71 (0.01)</td>
                <td>0.73 (0.01)</td>
                <td>0.50 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>Ensemble</td>
                <td>0.73 (0.01)</td>
                <td>0.80 (0.01)</td>
                <td>0.74 (0.02)</td>
                <td>0.77 (0.01)</td>
                <td>0.79 (0.01)</td>
                <td>0.43 (0.01)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>RSB: risky sexual behavior.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>RMSE: root-mean-square error.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>Nonuse of contraception indicated that someone did not use contraception every time they had sex.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>MLR: multiple logistic regression.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>BYS: naive Bayes.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>LDA: linear discriminant analysis.</p>
            </fn>
            <fn id="table2fn8">
              <p><sup>h</sup>RF: random forest.</p>
            </fn>
            <fn id="table2fn9">
              <p><sup>i</sup>GBM: gradient boosting machine.</p>
            </fn>
            <fn id="table2fn10">
              <p><sup>j</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table2fn11">
              <p><sup>k</sup>DL: deep learning.</p>
            </fn>
            <fn id="table2fn12">
              <p><sup>l</sup>Ineffective or unsafe contraception indicated that someone often used unsafe contraceptive methods (eg, emergency contraception, external ejaculation, and safe period).</p>
            </fn>
            <fn id="table2fn13">
              <p><sup>m</sup>Casual sex or sex with multiple partners indicated that someone had engaged in casual sex or sex with multiple partners before.</p>
            </fn>
            <fn id="table2fn14">
              <p><sup>n</sup>Integrated RSB was the combination of the former 3 types of RSB.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>AUROC curves among the different types of RSB. AUROC: area under the receiver operating characteristic curve; BYS: naive Bayes; DL: deep learning; GBM: gradient boosting machine; LDA: linear discriminant analysis; LR: logistic regression; RF: random forest; RSB: risky sexual behavior; XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="publichealth_v9i1e41162_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Variable Selection and Prediction for RSB</title>
        <p>Through the comprehensive comparison of the evaluation indicators considering both efficiency and robustness, XGBoost was chosen to form the predicting model. To comprehensively predict RSB, we took integrated RSB as the outcome to select important variables, which were ranked in the order of importance according to the XGBoost model. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows the trend of 6 indicators as the number of variables increases, where points represent the average performance and lines represent the range. The turning points of the 6 indicators were 5th, 8th, 7th, 7th, 6th, and 12th, respectively. Thus, we finally chose 12 key variables for our prediction model, as presented in <xref rid="figure2" ref-type="fig">Figure 2</xref>. It could be inferred that RSB has multiple types of influencing factors, including relationship status, sexual knowledge, sexual attitudes, and previous sexual experience. The final prediction model we developed could estimate not only the probability of a student engaging in RSB but also the kind of RSB they were more likely to engage in.</p>
        <p>To explore the specific association between the outcome variables and the predictive factors identified through XGBoost, we finally performed MLR, and the results of integrated RSB are presented in <xref ref-type="table" rid="table3">Table 3</xref>. It could be inferred that the lack of sexual knowledge and a liberal sexual attitude significantly increased the risk of RSB. In addition, regarding intimate relationship status, compared to the non-single group, the single group had a higher risk of RSB. Previous sexual experience also had a great influence on RSB. The greater the number of people participants had sexual intercourse with, the higher their risk of RSB. The more convenient access to contraceptives was, the lower the students' risk of RSB. The results of the other 3 types of RSB are shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The 12 most predictive variables selected by the XGBoost model. XGBoost: extreme gradient boosting.</p>
          </caption>
          <graphic xlink:href="publichealth_v9i1e41162_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Association between integrated RSB<sup>a</sup> and its key variables through MLR<sup>b</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="500"/>
            <col width="160"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Variable and option</td>
                <td colspan="2">Coefficient estimate</td>
                <td colspan="2">SE</td>
                <td colspan="2"><italic>Z</italic> value</td>
                <td><italic>P</italic> value (&#62;&#124;<italic>Z</italic>&#124;)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual knowledge: ejaculation outside the body is a contraceptive method.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Wrong</td>
                <td>N/A<sup>c</sup></td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Right</td>
                <td>0.46</td>
                <td colspan="2">0.07</td>
                <td colspan="2">6.99</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual knowledge: having sex during a safe period is a contraceptive method.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Wrong</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Right</td>
                <td>0.23</td>
                <td colspan="2">0.06</td>
                <td colspan="2">3.55</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual knowledge: as long as the timing is right, external ejaculation can effectively prevent pregnancy.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Wrong</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Right</td>
                <td>0.42</td>
                <td colspan="2">0.06</td>
                <td colspan="2">6.69</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual attitude: views on one-night stands or “booty calls.”</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I can accept it.</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I can understand my friends doing this, but I cannot.</td>
                <td>–0.44</td>
                <td colspan="2">0.07</td>
                <td colspan="2">–6.38</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Totally unacceptable.</td>
                <td>–0.28</td>
                <td colspan="2">0.07</td>
                <td colspan="2">–3.73</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual attitude: you don't have to wear a condom every time, because you don't always get pregnant without one.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Strongly disagree</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Relatively disagree</td>
                <td>1.05</td>
                <td colspan="2">0.07</td>
                <td colspan="2">15.09</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Not sure</td>
                <td>1.28</td>
                <td colspan="2">0.11</td>
                <td colspan="2">11.66</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Relatively agree</td>
                <td>1.68</td>
                <td colspan="2">0.17</td>
                <td colspan="2">9.76</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Strongly agree</td>
                <td>1.25</td>
                <td colspan="2">0.25</td>
                <td colspan="2">5.07</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Relationship status: your intimate relationship status.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nonsingle</td>
                <td>–0.39</td>
                <td colspan="2">0.06</td>
                <td colspan="2">–6.63</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual experience: having had penetrative sex (vaginal).</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Never has been and never will be acceptable.</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Never has been but I can accept it in the future.</td>
                <td>0.97</td>
                <td colspan="2">1.49</td>
                <td colspan="2">0.65</td>
                <td colspan="2">.52</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started before junior high school.</td>
                <td>1.42</td>
                <td colspan="2">1.42</td>
                <td colspan="2">1.00</td>
                <td colspan="2">.32</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started since senior high school.</td>
                <td>1.15</td>
                <td colspan="2">1.41</td>
                <td colspan="2">0.82</td>
                <td colspan="2">.42</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started since college.</td>
                <td>0.81</td>
                <td colspan="2">1.41</td>
                <td colspan="2">0.57</td>
                <td colspan="2">.57</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual experience: have you taken photos/videos during sex?</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Never has been and never will be acceptable.</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Never has been but I can accept it in the future.</td>
                <td>0.01</td>
                <td colspan="2">0.07</td>
                <td colspan="2">0.16</td>
                <td colspan="2">.87</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started before junior high school.</td>
                <td>0.17</td>
                <td colspan="2">0.35</td>
                <td colspan="2">0.49</td>
                <td colspan="2">.62</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started since senior high school.</td>
                <td>0.45</td>
                <td colspan="2">0.13</td>
                <td colspan="2">3.48</td>
                <td colspan="2">.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I started since college.</td>
                <td>0.46</td>
                <td colspan="2">0.07</td>
                <td colspan="2">6.32</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Sexual experience: age of partner with whom you first had penetrative sex.</td>
                <td colspan="2">0.01</td>
                <td colspan="2">0.01</td>
                <td colspan="2">1.38</td>
                <td>.17</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Sexual experience: the number of people you've had penetrative sex with.</td>
                <td colspan="2">0.33</td>
                <td colspan="2">0.02</td>
                <td colspan="2">13.93</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual experience: who is the decision maker regarding your contraceptive method?</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Myself.</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>My partner.</td>
                <td>0.17</td>
                <td colspan="2">0.09</td>
                <td colspan="2">2.01</td>
                <td colspan="2">.04</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>By mutual negotiation.</td>
                <td>0.11</td>
                <td colspan="2">0.06</td>
                <td colspan="2">1.82</td>
                <td colspan="2">.07</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>It depends.</td>
                <td>1.30</td>
                <td colspan="2">0.13</td>
                <td colspan="2">10.06</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Just use what we can find.</td>
                <td>0.84</td>
                <td colspan="2">0.23</td>
                <td colspan="2">3.67</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Others.</td>
                <td>–0.31</td>
                <td colspan="2">0.33</td>
                <td colspan="2">–0.93</td>
                <td colspan="2">.36</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Sexual experience: availability of contraceptives.</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Very convenient</td>
                <td>N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Relatively convenient</td>
                <td>0.30</td>
                <td colspan="2">0.06</td>
                <td colspan="2">5.41</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Relatively inconvenient</td>
                <td>0.41</td>
                <td colspan="2">0.08</td>
                <td colspan="2">4.91</td>
                <td colspan="2">&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Very inconvenient</td>
                <td>0.28</td>
                <td colspan="2">0.14</td>
                <td colspan="2">2.02</td>
                <td colspan="2">.04</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>RSB: risky sexual behavior.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>MLR: multiple logistic regression.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>N/A: not applicable as the baseline group.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>This study validated the effectiveness of ML models in predicting RSB among college students through comparisons of multiple models. Among various ML models, XGBoost performed the best in this task, with a higher accuracy, precision, <italic>F</italic><sub>1</sub>-score, and AUROC performance than others. Thus, we eventually used XGBoost to identify the 12 most predictive factors for total RSB, including relationship status, sexual knowledge, sexual attitudes, and previous sexual experience. This systematic process of data modeling as well as the accuracy of the final results indicated that ML approaches could have considerable value in RSB prediction and intervention among college students.</p>
        <p>ML models were substantially superior to conventional regressions and should be recommended for more practical applications. Compared to the AUROC values of the MLR model (0.76, 0.71, 0.91, and 0.79 on the 4 types of RSB, respectively), XGBoost performed much better in terms of AUROC values (0.78, 0.72, 0.94, and 0.80 on the 4 types of RSB, respectively). However, the explanatory capacity of MLR was nonnegligible. Thus, we finally used an MLR model again to investigate the linear association between outcomes and those important risk factors identified through XGBoost.</p>
        <p>In this study, demographic characteristics and socioeconomic status were found to be significant factors of RSBs. Adolescents who were from an ethnic minority background, held religious beliefs, or had a lower family financial status tended to engage in more RSBs. This may be due to the lack of sexual education resources or specific religious customs. In addition, it was worth noting that students who had migration experience or were from rural hometowns were associated with increased RSBs. This finding was consistent with previous research and reflects the persisting gap in adolescent sexual and reproductive health between urban and rural areas [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Correlated with a lower level of education and socioeconomic status, rural-to-urban adolescents had less exposure to sexual knowledge and sex education [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>In accordance with previous studies, romantic relationships were highly associated with RSB. It was found that college students with a romantic relationship had a significantly higher probability of using condoms during vaginal sex, oral sex, and anal sex [<xref ref-type="bibr" rid="ref23">23</xref>]. On the one hand, students not in romantic relationships usually had fewer condom-carrying practices and a higher occurrence of unplanned sex. On the other hand, according to Rosenthal et al [<xref ref-type="bibr" rid="ref31">31</xref>], rather than being concerned with the risk of STIs, students not in romantic relationships paid more attention to building intimacy through RSB, especially during casual sexual encounters. This is a worrisome mechanism since these students are more inclined to be unaware of each other’s health status, which could lead to a considerable risk of STIs.</p>
        <p>This study also validated the role of sexual attitude in RSB. The more tolerant the students were toward condom nonuse and one-night stands, the higher their probability of engaging in RSB. In fact, it has been widely validated that sexual attitude is the most influential factor in predicting RSB [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], which could be explained by the theory of planned behavior (TPB), in which attitude is an activator of behavior [<xref ref-type="bibr" rid="ref34">34</xref>]. Thus, sexual education should be facilitated to emphasize the importance and necessity of safe sex and dispel misunderstandings about it.</p>
        <p>In addition, students’ previous sexual experience also had a large influence on the possibility of RSB, such as the number of sexual partners, the decision maker regarding the contraceptive method, and whether photos/videos were taken during sex. This finding is also reasonable since well-practiced behavior is more likely to recur because the processes that initiate and control it become automatic [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are some limitations in this study. First, all outcomes and predictors were self-reported by participants, which may have caused recall bias and nonresponse bias. Since some questions were sensitive, participants may not have been willing to provide correct answers, such as those on previous sexual experience and experience of sexual harassment and assault. Second, the measurement of contraception use did not differentiate between the types of contraceptive methods used by the study population. Different contraceptive methods serve different functions. Condom use can prevent both STIs and unwanted pregnancies, while hormonal contraception is only effective for pregnancy prevention. Although the vast majority of participants used condoms for contraception, the predictive accuracy of contraceptive effectiveness may still have been obscured in this study because of the lack of differentiation across methods. Third, the definition of casual sex and sex with multiple partners was not well specified. Though these 2 types of behavior were undoubtedly validated as RSBs, the risks of contracting STIs and unwanted pregnancy can be kept relatively low with correct condom use. Fourth, although ML models have better predictive performance than traditional regression models, their explanatory performance is much weaker. We performed MLR to compensate for this drawback, but multicollinearity may exist among those selected risk factors, which could lead to inaccurate estimation. In particular, we had a large scale of many questions, with much similarity among them. Thus, questions could be divided into clusters to decrease the variable dimensions as well as strengthen the explanatory power. Fifth, since our model relied on a cross-sectional questionnaire, the outcomes and predictors were questioned concurrently. Under the same time window, it is difficult to identify the sequence of events. There may be causal inversion problems between predictors and outcomes, and thus, the prospective predictive efficiency of the model is hard to validate.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>There are considerable methodological, theoretical, and practical implications of this study. From the methodological aspect, we adopted a scientific and rigorous process to generate an RSB-predictive model using ML methods, which addresses a research gap and urgent work to be done. The selection of the model, the adjustment of parameters, the comparison of indicators, and the finalization of variable numbers are of high reference value in the methodology. From a theoretical perspective, we identified a series of risk factors for RSB. We provided additional evidence for the association of demographic characteristics and socioeconomic status with RSB. Critical factors influencing RSB were also explored, including sexual attitude, sexual knowledge, relationship status, and sexual experience. Through the results presented, a comprehensive and evidence-based guideline was formed to facilitate more precise interventions and prevent RSB among adolescents and young adults. From a practical perspective, we developed a predictive model to help identify RSB among college students. Due to privacy concerns and the stigmatization of sexual behavior, it is often difficult to investigate the real prevalence of RSB among adolescents. Using the 12 predictors identified here, the model can predict not only the probability of a student engaging in RSB but also what kind of RSB they are more likely to engage in. With such a model, our study allows for more targeted intervention and prevention of RSB in students before they contract STIs, and thus, these students will be better able to avoid the various negative consequences of RSB, including STIs and unwanted pregnancy.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>In summary, our study confirmed that ML approaches, especially XGBoost, have greater predictive effects for RSB than traditional regression models. Such ML-based assessment tools could generate new applications with considerable practical value, which would promote health at both the individual and the public level in the future.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary materials.</p>
        <media xlink:href="publichealth_v9i1e41162_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 472 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operator characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BYS</term>
          <def>
            <p>naive Bayes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DL</term>
          <def>
            <p>deep learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">GBM</term>
          <def>
            <p>gradient boosting machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LDA</term>
          <def>
            <p>linear discriminant analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MD</term>
          <def>
            <p>minimum distance</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MLR</term>
          <def>
            <p>multiple logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ROC</term>
          <def>
            <p>receiver operator characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">RMSE</term>
          <def>
            <p>root-mean-square error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">RSB</term>
          <def>
            <p>risky sexual behavior</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">STI</term>
          <def>
            <p>sexually transmitted infection</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to express gratitude to the China Family Planning Association and the China Youth Network for their support in data collection and to all the students who participated in this survey.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data that support the findings of this study are available upon reasonable request from the corresponding author (KT). The data are not publicly available due to research ethics board restrictions.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tilahun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mamo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Knowledge, attitude and practice towards risky sexual behaviors among secondary and preparatory students of Metu town, south western Ethiopia</article-title>
          <source>BMC Public Health</source>
          <year>2020</year>
          <month>09</month>
          <day>14</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>1394</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-020-09371-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-020-09371-4</pub-id>
          <pub-id pub-id-type="medline">32928174</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-020-09371-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7488992</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bellizzi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pichierri</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Menchini</surname>
              <given-names>Le</given-names>
            </name>
            <name name-style="western">
              <surname>Barry</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sotgiu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bassat</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>The impact of underuse of modern methods of contraception among adolescents with unintended pregnancies in 12 low- and middle-income countries</article-title>
          <source>J Glob Health</source>
          <year>2019</year>
          <month>12</month>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>020429</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31673342"/>
          </comment>
          <pub-id pub-id-type="doi">10.7189/jogh.09.020429</pub-id>
          <pub-id pub-id-type="medline">31673342</pub-id>
          <pub-id pub-id-type="pii">jogh-09-020429</pub-id>
          <pub-id pub-id-type="pmcid">PMC6815657</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>World Health Organization</collab>
          </person-group>
          <source>Adolescent Pregnancy</source>
          <access-date>2022-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/adolescent-pregnancy">https://www.who.int/news-room/fact-sheets/detail/adolescent-pregnancy</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>World Health Organization</collab>
          </person-group>
          <source>Contraception</source>
          <access-date>2022-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/health-topics/contraception#tab=tab_3">https://www.who.int/health-topics/contraception#tab=tab_3</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Apter</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Contraception options: aspects unique to adolescent and young adult</article-title>
          <source>Best Pract Res Clin Obstet Gynaecol</source>
          <year>2018</year>
          <month>04</month>
          <volume>48</volume>
          <fpage>115</fpage>
          <lpage>127</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bpobgyn.2017.09.010</pub-id>
          <pub-id pub-id-type="medline">29032945</pub-id>
          <pub-id pub-id-type="pii">S1521-6934(17)30144-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>[Perception on AIDS infection risk and condom use among 2785 college students having had sexual experience in Zhejiang Province]</article-title>
          <source>Zhonghua Liu Xing Bing Xue Za Zhi</source>
          <year>2006</year>
          <month>06</month>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>499</fpage>
          <lpage>502</lpage>
          <pub-id pub-id-type="medline">17152510</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Florence</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>Reported Condom Use in Students Enrolled in a Personal Health and Wellness Course</source>
          <year>2012</year>
          <access-date>2023-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://scholars.indstate.edu/bitstream/handle/10484/8210/Candace%20Florence.pdf?sequence=2&#38;isAllowed=y">https://scholars.indstate.edu/bitstream/handle/10484/8210/Candace%20Florence.pdf?sequence=2&#38;isAllowed=y</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>John-Leader</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pit</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Geosocial networking dating app usage and risky sexual behavior in young adults attending a music festival: cross-sectional questionnaire study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>15</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e21082</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e21082/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21082</pub-id>
          <pub-id pub-id-type="medline">33856354</pub-id>
          <pub-id pub-id-type="pii">v23i4e21082</pub-id>
          <pub-id pub-id-type="pmcid">PMC8085743</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thornton</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Frick</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>JV</given-names>
            </name>
            <name name-style="western">
              <surname>Wall Myers</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Steinberg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cauffman</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Risky sex, drugs, sensation seeking, and callous unemotional traits in justice-involved male adolescents</article-title>
          <source>J Clin Child Adolesc Psychol</source>
          <year>2019</year>
          <month>12</month>
          <day>13</day>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>68</fpage>
          <lpage>79</lpage>
          <pub-id pub-id-type="doi">10.1080/15374416.2017.1399398</pub-id>
          <pub-id pub-id-type="medline">29236522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Homma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Saewyc</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kishor</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The relationship between sexual abuse and risky sexual behavior among adolescent boys: a meta-analysis</article-title>
          <source>J Adolesc Health</source>
          <year>2012</year>
          <month>07</month>
          <volume>51</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22727072"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2011.12.032</pub-id>
          <pub-id pub-id-type="medline">22727072</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(12)00003-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4829388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Longo</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Ertl</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Pazienza</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Agiliga</surname>
              <given-names>AU</given-names>
            </name>
            <name name-style="western">
              <surname>Dillon</surname>
              <given-names>FR</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Associations among negative urgency, sensation seeking, alcohol use, self-esteem, and casual sexual behavior for college students</article-title>
          <source>Subst Use Misuse</source>
          <year>2020</year>
          <month>12</month>
          <day>26</day>
          <volume>55</volume>
          <issue>5</issue>
          <fpage>796</fpage>
          <lpage>805</lpage>
          <pub-id pub-id-type="doi">10.1080/10826084.2019.1703748</pub-id>
          <pub-id pub-id-type="medline">31876218</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Owen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fincham</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Short-term prospective study of hooking up among college students</article-title>
          <source>Arch Sex Behav</source>
          <year>2011</year>
          <month>04</month>
          <day>04</day>
          <volume>40</volume>
          <issue>2</issue>
          <fpage>331</fpage>
          <lpage>341</lpage>
          <pub-id pub-id-type="doi">10.1007/s10508-010-9697-x</pub-id>
          <pub-id pub-id-type="medline">21203816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anteneh</surname>
              <given-names>ZA</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and correlates of multiple sexual partnerships among private college students in Bahir Dar City, Northwest Ethiopia</article-title>
          <source>Sci J Public Health</source>
          <year>2013</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>9</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.11648/j.sjph.20130101.12</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Medina-Perucha</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Family</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dack</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with sexual risks and risk of STIs, HIV and other blood-borne viruses among women using heroin and other drugs: a systematic literature review</article-title>
          <source>AIDS Behav</source>
          <year>2019</year>
          <month>01</month>
          <day>02</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>222</fpage>
          <lpage>251</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30073636"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10461-018-2238-7</pub-id>
          <pub-id pub-id-type="medline">30073636</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10461-018-2238-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6342849</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mwaba</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thankian</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lwatula</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Risky sexual behaviour among university students</article-title>
          <source>Int STD Res Rev</source>
          <year>2016</year>
          <month>01</month>
          <day>10</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.9734/isrr/2016/25462</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Somba</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mbonile</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Obure</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mahande</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Sexual behaviour, contraceptive knowledge and use among female undergraduates' students of Muhimbili and Dar es Salaam Universities, Tanzania: a cross-sectional study</article-title>
          <source>BMC Womens Health</source>
          <year>2014</year>
          <month>08</month>
          <day>07</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>94</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcwomenshealth.biomedcentral.com/articles/10.1186/1472-6874-14-94"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6874-14-94</pub-id>
          <pub-id pub-id-type="medline">25099502</pub-id>
          <pub-id pub-id-type="pii">1472-6874-14-94</pub-id>
          <pub-id pub-id-type="pmcid">PMC4126911</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tuot</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chhea</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Saphonn</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with risky sexual behavior among unmarried most-at-risk young people in Cambodia</article-title>
          <source>Am J Public Health Res</source>
          <year>2014</year>
          <month>01</month>
          <day>07</day>
          <volume>2</volume>
          <issue>5</issue>
          <fpage>211</fpage>
          <lpage>220</lpage>
          <pub-id pub-id-type="doi">10.12691/ajphr-2-5-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adeoti</surname>
              <given-names>YF</given-names>
            </name>
          </person-group>
          <source>Predisposing Factors Influencing Risky Sexual Behaviours as Expressed by Undergraduates in Osun State Nigeria</source>
          <year>2016</year>
          <access-date>2023-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/PREDISPOSING-FACTORS-INFLUENCING-RISKY-SEXUAL-AS-BY-Adeoti/30ec975c0178833d67d79fb7b60b331c8a1ea831">https://tinyurl.com/2dnnzuch</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Amare</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yeneabat</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Amare</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A systematic review and meta-analysis of epidemiology of risky sexual behaviors in college and university students in Ethiopia</article-title>
          <source>J Environ Public Health</source>
          <year>2019</year>
          <month>03</month>
          <day>20</day>
          <volume>2019</volume>
          <fpage>4852130</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2019/4852130"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2019/4852130</pub-id>
          <pub-id pub-id-type="medline">31015844</pub-id>
          <pub-id pub-id-type="pmcid">PMC6446110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Seth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>DiClemente</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Association of depressive symptoms and substance use with risky sexual behavior and sexually transmitted infections among African American female adolescents seeking sexual health care</article-title>
          <source>Am J Public Health</source>
          <year>2015</year>
          <month>10</month>
          <volume>105</volume>
          <issue>10</issue>
          <fpage>2137</fpage>
          <lpage>2142</lpage>
          <pub-id pub-id-type="doi">10.2105/ajph.2014.302493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vasilenko</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Kugler</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Butera</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Lanza</surname>
              <given-names>ST</given-names>
            </name>
          </person-group>
          <article-title>Patterns of adolescent sexual behavior predicting young adult sexually transmitted infections: a latent class analysis approach</article-title>
          <source>Arch Sex Behav</source>
          <year>2015</year>
          <month>04</month>
          <day>22</day>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>705</fpage>
          <lpage>715</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24449152"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10508-014-0258-6</pub-id>
          <pub-id pub-id-type="medline">24449152</pub-id>
          <pub-id pub-id-type="pmcid">PMC4107199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Long</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Association between condom use and perspectives on contraceptive responsibility in different sexual relationships among sexually active college students in China: a cross-sectional study</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2019</year>
          <month>01</month>
          <volume>98</volume>
          <issue>1</issue>
          <fpage>e13879</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30608410"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000013879</pub-id>
          <pub-id pub-id-type="medline">30608410</pub-id>
          <pub-id pub-id-type="pii">00005792-201901040-00030</pub-id>
          <pub-id pub-id-type="pmcid">PMC6344162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ssewanyana</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sebena</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Petkeviciene</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lukács</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miovsky</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stock</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Condom use in the context of romantic relationships: a study among university students from 12 universities in four Central and Eastern European countries</article-title>
          <source>Eur J Contracept Reprod Health Care</source>
          <year>2015</year>
          <month>02</month>
          <day>09</day>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>350</fpage>
          <lpage>360</lpage>
          <pub-id pub-id-type="doi">10.3109/13625187.2014.1001024</pub-id>
          <pub-id pub-id-type="medline">25664484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Medland</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Fairley</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Predicting the diagnosis of HIV and sexually transmitted infections among men who have sex with men using machine learning approaches</article-title>
          <source>J Infect</source>
          <year>2021</year>
          <month>01</month>
          <volume>82</volume>
          <issue>1</issue>
          <fpage>48</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jinf.2020.11.007</pub-id>
          <pub-id pub-id-type="medline">33189772</pub-id>
          <pub-id pub-id-type="pii">S0163-4453(20)30702-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feller</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Using clinical notes and natural language processing for automated HIV risk assessment</article-title>
          <source>J Acquir Immune Defic Syndr</source>
          <year>2018</year>
          <month>02</month>
          <day>01</day>
          <volume>77</volume>
          <issue>2</issue>
          <fpage>160</fpage>
          <lpage>166</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29084046"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/QAI.0000000000001580</pub-id>
          <pub-id pub-id-type="medline">29084046</pub-id>
          <pub-id pub-id-type="pmcid">PMC5762388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gore</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Bloem</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Patton</surname>
              <given-names>GC</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Coffey</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sawyer</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Mathers</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Global burden of disease in young people aged 10–24 years: a systematic analysis</article-title>
          <source>Lancet</source>
          <year>2011</year>
          <month>06</month>
          <volume>377</volume>
          <issue>9783</issue>
          <fpage>2093</fpage>
          <lpage>2102</lpage>
          <pub-id pub-id-type="doi">10.1016/s0140-6736(11)60512-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>World Health Organization</collab>
          </person-group>
          <source>Older Adolescent (15 to 19 years) and Young Adult (20 to 24 years) Mortality</source>
          <access-date>2022-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/levels-and-trends-in-older-adolescent-(15-to-19-years)-and-young-adult-(20-to-24-years)-mortality">https://tinyurl.com/mt8hvbpy</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sudhinaraset</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Astone</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Migration and unprotected sex in Shanghai, China: correlates of condom use and contraceptive consistency across migrant and nonmigrant youth</article-title>
          <source>J Adolesc Health</source>
          <year>2012</year>
          <month>03</month>
          <volume>50</volume>
          <issue>3 Suppl</issue>
          <fpage>S68</fpage>
          <lpage>S74</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22340859"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2011.12.007</pub-id>
          <pub-id pub-id-type="medline">22340859</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(11)00665-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC4166512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Characteristics and determinants of sexual behavior among adolescents of migrant workers in Shangai (China)</article-title>
          <source>BMC Public Health</source>
          <year>2009</year>
          <month>06</month>
          <day>19</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>195</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/1471-2458-9-195"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2458-9-195</pub-id>
          <pub-id pub-id-type="medline">19538756</pub-id>
          <pub-id pub-id-type="pii">1471-2458-9-195</pub-id>
          <pub-id pub-id-type="pmcid">PMC2706248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zabin</surname>
              <given-names>LS</given-names>
            </name>
          </person-group>
          <article-title>Unmet needs for reproductive health knowledge among unmarried migrant youth</article-title>
          <source>J Reprod Contracept</source>
          <year>2008</year>
          <month>12</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>227</fpage>
          <lpage>238</lpage>
          <pub-id pub-id-type="doi">10.1016/s1001-7844(08)60025-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenthal</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gifford</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Safe sex or safe love: competing discourses?</article-title>
          <source>AIDS Care</source>
          <year>1998</year>
          <month>02</month>
          <day>27</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.1080/09540129850124569</pub-id>
          <pub-id pub-id-type="medline">9536200</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McEachan</surname>
              <given-names>RRC</given-names>
            </name>
            <name name-style="western">
              <surname>Conner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lawton</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Prospective prediction of health-related behaviours with the theory of planned behaviour: a meta-analysis</article-title>
          <source>Health Psychol Rev</source>
          <year>2011</year>
          <month>09</month>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>144</lpage>
          <pub-id pub-id-type="doi">10.1080/17437199.2010.521684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Albarracín</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Fishbein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Muellerleile</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Theories of reasoned action and planned behavior as models of condom use: a meta-analysis</article-title>
          <source>Psychol Bull</source>
          <year>2001</year>
          <month>01</month>
          <volume>127</volume>
          <issue>1</issue>
          <fpage>142</fpage>
          <lpage>161</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11271752"/>
          </comment>
          <pub-id pub-id-type="doi">10.1037/0033-2909.127.1.142</pub-id>
          <pub-id pub-id-type="medline">11271752</pub-id>
          <pub-id pub-id-type="pmcid">PMC4780418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bargh</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burrows</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Automaticity of social behavior: direct effects of trait construct and stereotype activation on action</article-title>
          <source>J Pers Soc Psychol</source>
          <year>1996</year>
          <volume>71</volume>
          <issue>2</issue>
          <fpage>230</fpage>
          <lpage>244</lpage>
          <pub-id pub-id-type="doi">10.1037/0022-3514.71.2.230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ouellette</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Habit and intention in everyday life: the multiple processes by which past behavior predicts future behavior</article-title>
          <source>Psychol Bull</source>
          <year>1998</year>
          <month>07</month>
          <volume>124</volume>
          <issue>1</issue>
          <fpage>54</fpage>
          <lpage>74</lpage>
          <pub-id pub-id-type="doi">10.1037/0033-2909.124.1.54</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
