<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e46708</article-id>
      <article-id pub-id-type="pmid">37930785</article-id>
      <article-id pub-id-type="doi">10.2196/46708</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Optimal Look-Back Period to Identify True Incident Cases of Diabetes in Medical Insurance Data in the Chinese Population: Retrospective Analysis Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Sanchez</surname>
            <given-names>Travis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Khatami</surname>
            <given-names>Alireza </given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yang</surname>
            <given-names>Can</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Wenyi</given-names>
          </name>
          <degrees>BM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2059-6839</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Baohua</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-8588-3444</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>Shaobo</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-1922-3590</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Jingxin</given-names>
          </name>
          <degrees>BM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-1891-076X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ai</surname>
            <given-names>Limei</given-names>
          </name>
          <degrees>BM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-9818-5227</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Zhengyu</given-names>
          </name>
          <degrees>BM</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-3772-0741</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Wan</surname>
            <given-names>Xia</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Institute of Basic Medical Sciences</institution>
            <institution>Chinese Academy of Medical Science</institution>
            <addr-line>Dongdan Street, 5th</addr-line>
            <addr-line>Beijing, 100052</addr-line>
            <country>China</country>
            <phone>86 01065233870</phone>
            <email>xiawan@ibms.pumc.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0738-5631</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institute of Basic Medical Sciences</institution>
        <institution>Chinese Academy of Medical Science</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>School of Basic Medicine</institution>
        <institution>Peking Union Medical College</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Chinese Center for Disease Control and Prevention</institution>
        <institution>National Institute for Prevention and Control of Chronic Noncommunicable Diseases</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Weifang Medical Insurance Center</institution>
        <addr-line>Weifang</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Clinical Medicine</institution>
        <institution>Qingdao University Medical College</institution>
        <addr-line>Qingdao</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xia Wan <email>xiawan@ibms.pumc.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>11</month>
        <year>2023</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e46708</elocation-id>
      <history>
        <date date-type="received">
          <day>22</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>4</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>26</day>
          <month>9</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Wenyi Yang, Baohua Wang, Shaobo Ma, Jingxin Wang, Limei Ai, Zhengyu Li, Xia Wan. Originally published in JMIR Public Health and Surveillance (https://publichealth.jmir.org), 06.11.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on https://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://publichealth.jmir.org/2023/1/e46708" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Accurate estimation of incidence and prevalence is vital for preventing and controlling diabetes. Administrative data (including insurance data) could be a good source to estimate the incidence of diabetes. However, how to determine the look-back period (LP) to remove cases with preceding records remains a problem for administrative data. A short LP will cause overestimation of incidence, whereas a long LP will limit the usefulness of a database. Therefore, it is necessary to determine the optimal LP length for identifying incident cases in administrative data.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to offer different methods to identify the optimal LP for diabetes by using medical insurance data from the Chinese population with reference to other diseases in the administrative data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Data from the insurance database of the city of Weifang, China from between January 2016 and December 2020 were used. To identify the incident cases in 2020, we removed prevalent patients with preceding records of diabetes between 2016 and 2019 (ie, a 4-year LP). Using this 4-year LP as a reference, consistency examination indexes (CEIs), including positive predictive values, the κ coefficient, and overestimation rate, were calculated to determine the level of agreement between different LPs and an LP of 4 years (the longest LP). Moreover, we constructed a retrograde survival function, in which survival (ie, incident cases) means not having a preceding record at the given time and the survival time is the difference between the date of the last record in 2020 and the most recent previous record in the LP. Based on the survival outcome and survival time, we established the survival function and survival hazard function. When the survival probability, S(t), remains stable, and survival hazard converges to zero, we obtain the optimal LP. Combined with the results of these two methods, we determined the optimal LP for Chinese diabetes patients.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The κ agreement was excellent (0.950), with a high positive predictive value (92.2%) and a low overestimation rate (8.4%) after a 2-year LP. As for the retrograde survival function, S(t) dropped rapidly during the first 1-year LP (from 1.00 to 0.11). At a 417-day LP, the hazard function reached approximately zero (h<sub>t</sub>=0.000459), S(t) remained at 0.10, and at 480 days, the frequency of S(t) did not increase. Combining the two methods, we found that the optimal LP is 2 years for Chinese diabetes patients.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The retrograde survival method and CEIs both showed effectiveness. A 2-year LP should be considered when identifying incident cases of diabetes using insurance data in the Chinese population.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>diabetes</kwd>
        <kwd>incident cases</kwd>
        <kwd>administrative data</kwd>
        <kwd>look-back period</kwd>
        <kwd>retrograde survival function</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diabetes is a severe, long-term disease that significantly impacts the lives of individuals, families, and societies worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. In the past 3 decades, the prevalence of type 2 diabetes has risen dramatically. About 422 million people worldwide have diabetes, and 1.5 million deaths are directly attributable to diabetes each year, as reported by World Health Organization in 2022. In 2013, China had the largest number of patients with diabetes and the second-highest spending on diabetes and its complications worldwide [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Therefore, to achieve global agreement and halt the worldwide rise in diabetes by 2025, it is crucial to prevent and control diabetes in China.</p>
      <p>An accurate estimate of incidence and prevalence plays a crucial role in properly preventing and controlling diabetes. Although large-scale and representative surveys could be used for precise estimation of incidence [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>], they are expensive, laborious, and time-consuming. Currently, only a few areas have established incident case surveillance systems for chronic diseases in China, and only for some chronic diseases (such as diabetes and hypertension), with short monitoring periods and few sample surveillance points, which limits their usefulness. An alternative method is to use administrative data, such as medical insurance data or disease registration data. Advantages of using these administrative data include easy access, low cost, and large sample size (covering the majority of residents), as well as the ability to follow up with participants longitudinally for many years; this has been confirmed by many researchers in other countries [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Since medical insurance reforms in 2012 [<xref ref-type="bibr" rid="ref12">12</xref>], China has vigorously promoted medical policies and expanded coverage of the population [<xref ref-type="bibr" rid="ref13">13</xref>]. Effective data have gradually accumulated during the past few years, making it possible to conduct research in this population.</p>
      <p>However, multiple records of the same patient make it a general challenge to identify true incident cases through medical insurance data, as it is difficult to define the starting point of certain diseases for a patient. Before the index year, a look-back (LP) period is used to deal with this problem. Patients with a diabetes diagnosis in the index year and without a diabetes diagnosis in the LP would be identified as incident cases. Until now, there has been no consensus on the length of the LP. An insufficient LP might cause overestimation of incidence [<xref ref-type="bibr" rid="ref14">14</xref>], whereas an overlong LP would limit the number of reporting years and the usefulness of the database. Researchers have found that different diseases have different LPs due to specific trajectories [<xref ref-type="bibr" rid="ref11">11</xref>]. For diabetes, Brameld et al [<xref ref-type="bibr" rid="ref15">15</xref>] identified an LP of 13 years using data from the Western Australian Data Linkage System, while Asghari et al identified an LP of 5 years using data from the Régie de l’assurance maladie du Québec [<xref ref-type="bibr" rid="ref7">7</xref>]. We believe that different patterns of medical contact cycles among countries may cause these different findings on LPs. However, there is no study on the optimal LP in the Chinese population for diabetes.</p>
      <p>In this study, we will use 2 methods to identify the optimal LP for diabetes in the Chinese population, using data from an insurance database for 2016 to 2020 obtained from the Medical Security Bureau (MSB) of the city of Weifang, China, as an example. Weifang, a prefecture-level city in Shandong province with 9.4 million long-term residents, has a systematic method for ensuring medical service, and the coverage rate for medical insurance reached 96.15% in 2021. The aim of this study is to identify the optimal LP for diabetes for the Chinese population and additionally to compare different results by using different methods to obtain a reference for other diseases in the administrative data.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>The proposal for this study was reviewed by Chinese Academy of Medical Science &#38; School of Basic Medicine (033-2018). The insurance claims data were obtained from the MSB of Weifang. In order to protect the privacy of patients, all personally identifiable information in the database is obfuscated.</p>
      </sec>
      <sec>
        <title>Data Sources</title>
        <p>The database used in this study included all in- or outpatient claim records of patients in Weifang for 2016 to 2020 provided by the local MSB. The social health insurance system covered approximately all residents in Weifang (close to 9 million individuals) during the period from 2016 to 2020. Each claim record contains (1) basic information about the patient, including personal identification number, gender, date of birth, and type of medical insurance; (2) medical information, including hospital name and code, admission and discharge time, and diagnosis of disease; and (3) details of medical service expenses, including total expenses, out-of-pocket expenses, and reimbursement expenses.</p>
      </sec>
      <sec>
        <title>Data Processing</title>
        <p>Firstly, due to the changes in the Weifang disease coding system and the special disease codes in outpatient chronic-disease records, the initial disease codes in the database were partly based on the International Classification of Diseases, 10th Revision (ICD-10). Therefore, the diagnoses were harmonized with the ICD-10 according to the code-disease mapping table provided by the MSB of Weifang. Later, records with critical missing information, such as gender (418/21,855,530, &#60;0.001%) or disease diagnosis (1,068,910/21,855,530, 4.89%), were deleted. The data processing is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow chart showing included and excluded records and the process used for data cleaning of the insurance claim data (January 1, 2016, to December 31, 2020). ICD-10: International Classification of Disease, 10th Revision.</p>
          </caption>
          <graphic xlink:href="publichealth_v9i1e46708_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Definition of Incident Diabetes for the Application of Different LPs</title>
        <p>First, we defined diabetes (ICD-10 codes E10-E14) cases as those with at least 1 inpatient claim record or 3 outpatient claim records with a diagnosis of diabetes, considering that inpatient records are more reliable than outpatient records [<xref ref-type="bibr" rid="ref16">16</xref>]. In this database, we found that all patients defined as having diabetes had more than 3 outpatient records, reflecting the regularity of medical contact.</p>
        <p>Second, we defined incident diabetes cases. The procedure to identify incident cases was to exclude cases with any in- or outpatient records of diabetes in the given LP, before the index year. Different LPs may classify patients as having different statuses. Two scenarios for assumed different LPs are shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. Scenario 1 (LP1) shows that patient B will be identified as an incident case but patient A will not. Scenario 2 (LP2) shows that with the extension of the LP, more records of patient B might be caught, but patient A and patient B will both be identified as prevalent cases. In order to use as long an LP as possible in this study, we used 2020 as the index year and a 4-year LP (2016-2019) as the longest LP.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Definition of incident cases under 2 scenarios. Scenario 1 (LP1): patient B will be identified as an incident case but patient A will not; scenario 2 (LP2): both patient A and patient B are not identified as incident diabetes cases. LP: look-back period.</p>
          </caption>
          <graphic xlink:href="publichealth_v9i1e46708_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>Two methods were developed to identify the optimal LP. First, consistency examination indexes (CEIs) were used to determine the level of agreement between different LPs from a quarter of a year to 4 years. Second, a retrograde survival function method was used. Finally, the optimal LP was selected after considering the results from the above approaches.</p>
        <p>The CEIs include the κ value, positive predictive values (PPVs), and overestimation value. The relative formulas have been reported in other papers [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. The κ value is categorized as follows: values between –1 and 0 represent “no agreement”; between 0 and 0.20 represent “poor agreement”; between 0.21 and 0.40 represent “slight agreement”; between 0.41 and 0.60 represent “fair agreement”; between 0.61 and 0.80 represent “good agreement”; between 0.81 and 0.90 represent “very good agreement”; and between 0.91 and 1.0 represent “excellent agreement” [<xref ref-type="bibr" rid="ref17">17</xref>]. The PPVs are used to estimate the probability of identifying a true incident case among those identified as being new cases [<xref ref-type="bibr" rid="ref18">18</xref>], calculated using the 4-year LP as the reference time. The overestimation of incident cases decreased with extension of the LP, which reflects the impact of the length of the LP impacts on the number of incident cases. All the CEIs mentioned above were calculated at quarter-year intervals during the first year of the LP and 1-year intervals after the first year, since the number of identified incident cases varied greatly within the first year of the LP in previous studies [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p>
        <p>With the retrograde survival function method, survival (ie, being an incident case) means not having a preceding record at the given time. In detail, for each record in this study, let <italic>a</italic> represent the date of the last record of diabetes of a patient in 2020, <italic>b</italic> the date of the most recent previous record in the LP, and <italic>c</italic> the first date of the LP. The retrograde survival time is (<italic>a</italic>–<italic>b</italic>) for patients with preceding records. Patients without preceding records during the LP, indicating survival, are defined as censored cases, with the censored time (<italic>a – c</italic>). Based on the survival time and censored time, we established the survival function. Survival probability, S(t), the probability of surviving at a specific time, is represented by the equation S(t)=P (T&#62;t), where <italic>T</italic> is the year of the LP, calculated using the Kaplan-Meier estimator. Then, we used the following 2 approaches to determine the optimal LP based on the survival function. For the first approach, we constructed a hazard function. The hazard function represents the instantaneous probability of having the end point event during (<italic>t,∆t</italic>) conditional on survival up to <italic>t</italic> or later. In actuarial terms, it is calculated by <inline-graphic xlink:href="publichealth_v9i1e46708_fig5.png" xlink:type="simple" mimetype="image"/>, where <italic>d<sub>∆t</sub></italic> is the number of patients with the previous record during (<italic>t,∆t</italic>) and <italic>n<sub>t</sub></italic> is the patient at risk during the interval. Since the retrograde hazard of diabetes will decrease and converge to zero and the survival function will converge to the “true” probability of being incident, we assumed that a time point (<italic>tf</italic>) exists where <inline-graphic xlink:href="publichealth_v9i1e46708_fig6.png" xlink:type="simple" mimetype="image"/>. At this point (<italic>tf</italic>), all cases with preceding records have been found, and the remaining cases are risk-free; this is exactly the optimal LP. To estimate (<italic>tf</italic>), for practical purposes, we defined (<italic>tf</italic>) as the first time point when h<sub>t</sub> ≤0.0005. For the second approach, we counted the frequency of S(t) corresponding to each day calculated by the retrograde survival function. We assumed that there was a stable S(t), where the frequency was high and increased significantly, representing that S(t) stays at S(<italic>t<sub>f</sub></italic>) relatively constantly over a long time and that the change in S(t) approaches zero. The t<sub>f</sub> will be considered as the point when S(t) first reaches S(<italic>t<sub>f</sub></italic>).</p>
        <p>Statistical analyses were performed using SAS (version 9.4; SAS institute).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>After removing records according to the criteria above, 16,132,023 records from medical insurance claims data from 2016 to 2020 were used in this study; these records came from 3,185,337 individuals. There were 3,600,089 records and 247,254 cases of diabetes in total. The insurance record history of 109,476 diabetes prevalent cases in 2020 was screened with the different LPs to identify incident cases. Inclusion and exclusion details are shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>, and basic information on the data is shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Basic information on the data used in this study (January 1, 2016, to December 31, 2020). “Insurance records” represents all claims and diabetes records in each year. “Individuals with insurance records” represents the number of persons with claims in each year. “Visits per capita” was calculated as the number of insurance records divided by the number of individuals with insurance records.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="130"/>
          <col width="140"/>
          <col width="140"/>
          <col width="0"/>
          <col width="140"/>
          <col width="140"/>
          <col width="0"/>
          <col width="140"/>
          <col width="140"/>
          <thead>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td colspan="3">Insurance records, n</td>
              <td colspan="3">Individuals with insurance records, n</td>
              <td colspan="2">Visits per capita, n</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>Inpatient</td>
              <td>Outpatient</td>
              <td colspan="2">Inpatient</td>
              <td>Outpatient</td>
              <td colspan="2">Inpatient</td>
              <td>Outpatient</td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Entire database</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2016</td>
              <td>1,227,374</td>
              <td>1,326,862</td>
              <td colspan="2">894,726</td>
              <td>128,819</td>
              <td colspan="2">1.37</td>
              <td>10.30</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2017</td>
              <td>1,459,273</td>
              <td>1,583,937</td>
              <td colspan="2">1,027,600</td>
              <td>151,130</td>
              <td colspan="2">1.42</td>
              <td>10.48</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2018</td>
              <td>1,484,065</td>
              <td>1,815,786</td>
              <td colspan="2">1,024,998</td>
              <td>168,547</td>
              <td colspan="2">1.45</td>
              <td>10.77</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2019</td>
              <td>1,559,320</td>
              <td>2,123,446</td>
              <td colspan="2">1,061,351</td>
              <td>196,294</td>
              <td colspan="2">1.47</td>
              <td>10.82</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2020</td>
              <td>1,393,165</td>
              <td>2,158,795</td>
              <td colspan="2">947,821</td>
              <td>220,560</td>
              <td colspan="2">1.47</td>
              <td>9.79</td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Diabetes cases</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2016</td>
              <td>26,597</td>
              <td>526,619</td>
              <td colspan="2">23,117</td>
              <td>58,703</td>
              <td colspan="2">1.15</td>
              <td>8.97</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2017</td>
              <td>31,053</td>
              <td>618,289</td>
              <td colspan="2">26,833</td>
              <td>67,542</td>
              <td colspan="2">1.16</td>
              <td>9.15</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2018</td>
              <td>31,668</td>
              <td>699,739</td>
              <td colspan="2">27,425</td>
              <td>75,361</td>
              <td colspan="2">1.15</td>
              <td>9.29</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2019</td>
              <td>34,131</td>
              <td>793,431</td>
              <td colspan="2">29,594</td>
              <td>87,197</td>
              <td colspan="2">1.15</td>
              <td>9.10</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2020</td>
              <td>30,604</td>
              <td>807,958</td>
              <td colspan="2">27,038</td>
              <td>97,396</td>
              <td colspan="2">1.13</td>
              <td>8.30</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>Applying the longest LP identified 19,086 incident cases of diabetes. Only 17% (19,087/109,476) of the prevalent patients in 2020 were identified as incident cases as they did not have preceding records for diabetes in the longest LP before 2020, revealing that around 80% (90,389/109,476) of patients in 2020 were not truly incident cases. The κ coefficient and PPVs for these results rose with extension of the LP. Agreement was good when a quarter-year LP (κ=0.751) was used, changing to very good (κ=0.899) and excellent (κ=0.950) when the 1-year and 2-year LPs were used. As for PPVs, to achieve a PPV of at least 90% (10% of false positives) [<xref ref-type="bibr" rid="ref19">19</xref>], an LP of 2 years was necessary. The overestimation rate decreased with the extension of the length of the LP and did so especially sharply during the 1-year LP. After a 2-year LP, the overestimation decreased by under 10%. In general, according to the results of these CEIs, the optimal LP is 2 years for the Chinese population. Detailed information on the CEIs is shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Positive predictive values, κ coefficients, and overestimation with different look-back periods, all of which represent the agreement between the incident cases with different look-back periods and the 4-year look-back period as the longest period. Incident cases are defined as those not having previous records in the corresponding look-back period.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="150"/>
          <col width="250"/>
          <col width="200"/>
          <col width="200"/>
          <col width="200"/>
          <thead>
            <tr valign="top">
              <td>LP<sup>a</sup> (years)</td>
              <td>Incident cases, n</td>
              <td>PPV<sup>b</sup>, %</td>
              <td>κ</td>
              <td>Overestimation, %</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>0.25</td>
              <td>29,407</td>
              <td>0.674</td>
              <td>0.751</td>
              <td>0.485</td>
            </tr>
            <tr valign="top">
              <td>0.5</td>
              <td>26,195</td>
              <td>0.756</td>
              <td>0.825</td>
              <td>0.323</td>
            </tr>
            <tr valign="top">
              <td>0.75</td>
              <td>24,172</td>
              <td>0.819</td>
              <td>0.876</td>
              <td>0.220</td>
            </tr>
            <tr valign="top">
              <td>1</td>
              <td>23,288</td>
              <td>0.850</td>
              <td>0.899</td>
              <td>0.176</td>
            </tr>
            <tr valign="top">
              <td>2</td>
              <td>21,472</td>
              <td>0.922</td>
              <td>0.950</td>
              <td>0.084</td>
            </tr>
            <tr valign="top">
              <td>3</td>
              <td>20,468</td>
              <td>0.968</td>
              <td>0.980</td>
              <td>0.033</td>
            </tr>
            <tr valign="top">
              <td>4</td>
              <td>19,806</td>
              <td>1</td>
              <td>N/A<sup>c</sup></td>
              <td>0</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>LP: look-back period.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>PPV: positive predictive value.</p>
          </fn>
          <fn id="table2fn3">
            <p><sup>c</sup>N/A: not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>The retrograde survival function graphically represented the exclusion, showing the greatest decrease during the first year of screening (<xref rid="figure3" ref-type="fig">Figure 3</xref>). During the first 1-year LP, S(t) dropped from 1.00 to 0.11 (365 days) rapidly. The more days were included in the LP, the more the survival function converged to the “true” probability of being incident [<xref ref-type="bibr" rid="ref18">18</xref>]. According to the hazard function, the first time point when h<sub>t</sub> ≤0.0005 was with a 417-day LP: h<sub>t</sub>=0.000459; S(t)=0.11. This meant that the derivative (slope) of the survival function tended toward zero at this time.</p>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>(A) Change in survival probability with LPs with different numbers of days. Survival probability represents the probability of being an incident case at a specific day in the LP, which is calculated using the Kaplan-Meier estimator. (B) Change in survival hazard with LPs with different numbers of days. Survival hazard represents the instantaneous probability of having the end point event. LP: look-back period.</p>
        </caption>
        <graphic xlink:href="publichealth_v9i1e46708_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>The results for frequency showed that the frequency of S(t) was small, from 1.00 to 0.13, indicating that S(t) changed greatly. A change in S(t) from 0.11 to 0.10 means that the frequency has significantly increased, from 169 to 408, which is more than double (<xref rid="figure4" ref-type="fig">Figure 4</xref>). This means that the risk for a preceding record at this time remained relatively constant at 0.10 over a very long time, and the first day when S(t) reached 0.10 was 480 days. Combining the results for frequency and hazard function, the retrograde survival function method showed that the optimal LP was more than 400 days, which is closest to 2 years.</p>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>The frequency of S(t). *The frequency of S(t) from 0.97 to 0.26 was between 1 and 3. LP: look-back period.</p>
        </caption>
        <graphic xlink:href="publichealth_v9i1e46708_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>When using 2 years as the optimal LP, there were 21,472 incident cases. The number of female patients (n=10,862) was a little more than that of male patients (n=10,610), and 84.74% (18,192/21,472) of incident cases were between the ages of 45 and 79 years (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Incident cases applying a 2-year look-back period (ie, using 2018 and 2019 to identify incident cases in 2020) with different ages and genders.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="250"/>
          <col width="250"/>
          <col width="250"/>
          <col width="250"/>
          <thead>
            <tr valign="top">
              <td>Age group (years)</td>
              <td>Male patients, n (n=10,610)</td>
              <td>Female patients, n (n=10,862)</td>
              <td>Total patients, n (n=21,472)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>0-4</td>
              <td>4</td>
              <td>7</td>
              <td>11</td>
            </tr>
            <tr valign="top">
              <td>5-9</td>
              <td>7</td>
              <td>16</td>
              <td>23</td>
            </tr>
            <tr valign="top">
              <td>10-14</td>
              <td>36</td>
              <td>29</td>
              <td>65</td>
            </tr>
            <tr valign="top">
              <td>15-19</td>
              <td>34</td>
              <td>23</td>
              <td>57</td>
            </tr>
            <tr valign="top">
              <td>20-24</td>
              <td>52</td>
              <td>45</td>
              <td>97</td>
            </tr>
            <tr valign="top">
              <td>25-29</td>
              <td>99</td>
              <td>63</td>
              <td>162</td>
            </tr>
            <tr valign="top">
              <td>30-34</td>
              <td>308</td>
              <td>194</td>
              <td>502</td>
            </tr>
            <tr valign="top">
              <td>35-39</td>
              <td>401</td>
              <td>178</td>
              <td>579</td>
            </tr>
            <tr valign="top">
              <td>40-44</td>
              <td>577</td>
              <td>271</td>
              <td>848</td>
            </tr>
            <tr valign="top">
              <td>45-49</td>
              <td>961</td>
              <td>538</td>
              <td>1499</td>
            </tr>
            <tr valign="top">
              <td>50-54</td>
              <td>1432</td>
              <td>1073</td>
              <td>2505</td>
            </tr>
            <tr valign="top">
              <td>55-59</td>
              <td>1806</td>
              <td>1720</td>
              <td>3526</td>
            </tr>
            <tr valign="top">
              <td>60-64</td>
              <td>1544</td>
              <td>1778</td>
              <td>3322</td>
            </tr>
            <tr valign="top">
              <td>65-69</td>
              <td>1504</td>
              <td>2061</td>
              <td>3565</td>
            </tr>
            <tr valign="top">
              <td>70-74</td>
              <td>1000</td>
              <td>1533</td>
              <td>2533</td>
            </tr>
            <tr valign="top">
              <td>75-79</td>
              <td>481</td>
              <td>764</td>
              <td>1245</td>
            </tr>
            <tr valign="top">
              <td>80-84</td>
              <td>269</td>
              <td>394</td>
              <td>663</td>
            </tr>
            <tr valign="top">
              <td>≥85</td>
              <td>95</td>
              <td>175</td>
              <td>270</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>In our study, a 2-year LP had good CEIs with excellent κ agreement (0.950&#62;0.9), a high PPV (92.2%) and a lower than 10% overestimation rate. As for the retrograde survival function, it showed that a 2-year LP can reliably distinguish new cases in a prevalent pool. According to the results of the methods above, we confirmed that the optimal LP for identifying incident cases of diabetes using the Chinese insurance database provided by the MSB of Weifang is around 2 years, and all the methods are effective and stable.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <sec>
          <title>Optimal Length of LP Compared to Other Work</title>
          <p>A 2-year LP for diabetes incident case identification using administrative data is the same length as used by a few previous studies [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. A study in Manitoba, Canada, also showed a probability of 0.96 for patients with diabetes to have subsequent medical contact for diabetes within 2 years [<xref ref-type="bibr" rid="ref22">22</xref>]. However, our results differ from those of Asghari et al [<xref ref-type="bibr" rid="ref7">7</xref>], who reported an LP of 5 years for health insurance data from Quebec, Canada. A possible reason might be different patterns and medical contact cycles among Chinese and Canadian populations caused by the different medical insurance policies. The hazard function figure (<xref rid="figure3" ref-type="fig">Figure 3</xref>B) reflects this difference. In our study, the hazard function was not monotonic, indicating that a few diabetes patients had medical contact irregularly in this database, unlike the Canadian insurance data. n addition, different judgment criteria on CEIs and h<sub>t</sub> in these studies might have caused the differences.</p>
        </sec>
        <sec>
          <title>Methodological Comparison</title>
          <p>As for retrograde survival function, Brameld et al [<xref ref-type="bibr" rid="ref15">15</xref>] chose a hazard rate under 0.00001 as the standard when using the retrograde survival method for identifying the optimal LP for diabetes, resulting in a 13-year optimal LP for diabetes among a group of LPs with the longest LP being 15 years, much longer than our study and most other studies [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. We think an overly strict standard may have caused an overly long LP. To avoid an overly long estimation of optimal LP, we used h<sub>t</sub> ≤0.0005 as the criterion, which is similar to the study by Asghari et al [<xref ref-type="bibr" rid="ref7">7</xref>], which showed that a 2-year LP was optimal for diabetes. That study defined the optimal LP as the time when S(t) was stable and constant [<xref ref-type="bibr" rid="ref7">7</xref>]; however, the authors did not provide a detailed definition for stable S(t), that is, S(t<sub>f</sub>). In our study, we tried a new approach. We counted the frequency of S(t) and defined S(t<sub>f</sub>) by the frequency of S(t) being greatest and increasing significantly.</p>
          <p>Regarding CEIs, such as the κ coefficient, PPVs, and overestimation rate, although they are convenient to calculate and used by many researchers, their criteria are not completely consistent between studies. The overestimation rate has been used by a few researchers to evaluate the impact of varying lengths of LP [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>], with values such as 10% [<xref ref-type="bibr" rid="ref11">11</xref>] and 20% [<xref ref-type="bibr" rid="ref21">21</xref>]. It is the same for PPVs, as some studies have chosen 80% as the evaluation criterion [<xref ref-type="bibr" rid="ref19">19</xref>], while some have chosen 90% [<xref ref-type="bibr" rid="ref28">28</xref>]. The criteria of the κ coefficient have generally between consistent (0.8 or 0.9) [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], but some researchers have considered that such high agreement may be related to the high number of prevalent cases of diabetes [<xref ref-type="bibr" rid="ref7">7</xref>]. Therefore, the effectiveness of κ may remain to be further verified.</p>
          <p>Because of the inconsistency of criteria, Beaudet et al [<xref ref-type="bibr" rid="ref18">18</xref>] chose to combine the results of κ and PPV to identify the optimal LP. In our study, we compared the results of the κ coefficient, PPV, the overestimation rate, and the retrograde survival method. We found that a κ coefficient of 0.9, 90% PPV, 10% overestimation, and 0.0005 hazard rate may be the most suitable criteria, returning stable and constant results, with a 2-year LP as the optimal period.</p>
          <p>In general, the CEIs were convenient to calculate, while retrograde survival curves showed the probability of “surviving” converging to the plateau, allowing us to obtain the optimal LP visually and quantitively. Moreover, the criteria of these methods are different. Previous studies have mostly used only one method for identifying the optimal LP, whereas 2 different methods, as used in this study, may lead to more robust results, which could then be referred to when analyzing LPs for other diseases in the administrative data.</p>
        </sec>
      </sec>
      <sec>
        <title>Number of Incident Diabetes Cases</title>
        <p>In our study, there were 109,467 diabetes cases in 2020 before LP adjustment. After using the 2-year LP, the number of incident cases decreased to 21,472, which means this adjustment is important. In addition, our study showed that 84.74% (18,192/21,472) of incident cases were between the ages of 45 to 79 years, indicating that the middle-aged and older population has a high incidence of diabetes. We should make efforts to focus on this population to prevent diabetes.</p>
      </sec>
      <sec>
        <title>Innovativeness</title>
        <p>Our study is the first to identify 2 years as the optimal LP for diabetes in the Chinese population when using insurance data, which supports efforts to estimate the incidence of diabetes among populations using insurance data. More importantly, we used 2 different methods to identify the optimal LP, a method that could be referred to when analyzing LPs for other diseases in administrative data.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has some limitations. In our database, without more detailed records for disease classification, it was not possible to differentiate between type 1 and type 2 diabetes. However, there are far fewer patients with type 1 diabetes than with type 2 diabetes in the overall population. Thus, we considered the study population to be generally homogeneous and that these results may be representative and stable. Furthermore, we only applied up to a 4-year LP. Although the results of the retrograde survival function analysis showed stabilization of risk of being a preceding case after a 2-year LP, we expect to use longer LPs in future studies with more accumulated data.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>All CEIs (the κ coefficient, PPV, and overestimation rate) and the retrograde survival function method can effectively identify the optimal LP for diabetes incident cases, with stable and constant results. We found that a 2-year LP was optimal to remove preceding diabetes cases and identify the true incidence of diabetes using medical insurance data in the Chinese population.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CEI</term>
          <def>
            <p>consistency examination index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ICD-10</term>
          <def>
            <p>International Classification of Diseases, 10th Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LP</term>
          <def>
            <p>look-back period</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MSB</term>
          <def>
            <p>Medical Security Bureau</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank all participants and staff of the Weifang Medical Insurance Center for their contributions to this work. The authors also acknowledge the contribution to this study of the Center for Disease Control and Prevention of Weifang City. The authors appreciate the support of the China Medical Board (CMB), which supported the CMB Collaborating Program in Burden of Diseases in China (15-208).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The insurance database used in this study is not publicly available due to a confidentiality agreement with Medical Security Bureau of Weifang but it is available from the corresponding author on reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeedi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Petersohn</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Salpea</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Malanda</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Karuranga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Unwin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Colagiuri</surname>
              <given-names>Stephen</given-names>
            </name>
            <name name-style="western">
              <surname>Guariguata</surname>
              <given-names>Leonor</given-names>
            </name>
            <name name-style="western">
              <surname>Motala</surname>
              <given-names>Ayesha A</given-names>
            </name>
            <name name-style="western">
              <surname>Ogurtsova</surname>
              <given-names>Katherine</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>Jonathan E</given-names>
            </name>
            <name name-style="western">
              <surname>Bright</surname>
              <given-names>Dominic</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>Rhys</given-names>
            </name>
          </person-group>
          <article-title>Global and regional diabetes prevalence estimates for 2019 and projections for 2030 and 2045: Results from the International Diabetes Federation Diabetes Atlas, 9 edition</article-title>
          <source>Diabetes Res Clin Pract</source>
          <year>2019</year>
          <month>11</month>
          <volume>157</volume>
          <fpage>107843</fpage>
          <pub-id pub-id-type="doi">10.1016/j.diabres.2019.107843</pub-id>
          <pub-id pub-id-type="medline">31518657</pub-id>
          <pub-id pub-id-type="pii">S0168-8227(19)31230-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and ethnic pattern of diabetes and prediabetes in China in 2013</article-title>
          <source>JAMA</source>
          <year>2017</year>
          <month>06</month>
          <day>27</day>
          <volume>317</volume>
          <issue>24</issue>
          <fpage>2515</fpage>
          <lpage>2523</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28655017"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2017.7596</pub-id>
          <pub-id pub-id-type="medline">28655017</pub-id>
          <pub-id pub-id-type="pii">2633917</pub-id>
          <pub-id pub-id-type="pmcid">PMC5815077</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and treatment of diabetes in China, 2013-2018</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>12</month>
          <day>28</day>
          <volume>326</volume>
          <issue>24</issue>
          <fpage>2498</fpage>
          <lpage>2506</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34962526"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2021.22208</pub-id>
          <pub-id pub-id-type="medline">34962526</pub-id>
          <pub-id pub-id-type="pii">2787545</pub-id>
          <pub-id pub-id-type="pmcid">PMC8715349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shibayama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Noguchi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tamiya</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Relationship between social engagement and diabetes incidence in a middle-aged population: Results from a longitudinal nationwide survey in Japan</article-title>
          <source>J Diabetes Investig</source>
          <year>2018</year>
          <month>09</month>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>1060</fpage>
          <lpage>1066</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29430865"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jdi.12820</pub-id>
          <pub-id pub-id-type="medline">29430865</pub-id>
          <pub-id pub-id-type="pmcid">PMC6123021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hawkins Carranza</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Corbatón-Anchuelo</surname>
              <given-names>Arturo</given-names>
            </name>
            <name name-style="western">
              <surname>Bermejo Pareja</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Martín-Arriscado Arroba</surname>
              <given-names>Cristina</given-names>
            </name>
            <name name-style="western">
              <surname>Vega-Quiroga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Benito-León</surname>
              <given-names>Julián</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano-Ríos</surname>
              <given-names>Manuel</given-names>
            </name>
          </person-group>
          <article-title>Incidence of type 2 diabetes in the elderly in Central Spain: Association with socioeconomic status, educational level, and other risk factors</article-title>
          <source>Prim Care Diabetes</source>
          <year>2022</year>
          <month>04</month>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>279</fpage>
          <lpage>286</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1751-9918(21)00232-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pcd.2021.12.016</pub-id>
          <pub-id pub-id-type="medline">35065897</pub-id>
          <pub-id pub-id-type="pii">S1751-9918(21)00232-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boonpor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Celis-Morales</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Association of self-reported walking pace with type 2 diabetes incidence in the UK Biobank Prospective Cohort Study</article-title>
          <source>Mayo Clin Proc</source>
          <year>2022</year>
          <month>09</month>
          <volume>97</volume>
          <issue>9</issue>
          <fpage>1631</fpage>
          <lpage>1640</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mayocp.2022.02.028</pub-id>
          <pub-id pub-id-type="medline">36058577</pub-id>
          <pub-id pub-id-type="pii">S0025-6196(22)00132-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asghari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Courteau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carpentier</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Vanasse</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Optimal strategy to identify incidence of diagnostic of diabetes using administrative data</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2009</year>
          <month>08</month>
          <day>28</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>62</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-9-62"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2288-9-62</pub-id>
          <pub-id pub-id-type="medline">19715586</pub-id>
          <pub-id pub-id-type="pii">1471-2288-9-62</pub-id>
          <pub-id pub-id-type="pmcid">PMC2745425</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mok</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Simard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dubé</surname>
              <given-names>Marjolaine</given-names>
            </name>
            <name name-style="western">
              <surname>Larocque</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Plante</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Legault</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Huot</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wafa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rahme</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nakhla</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Increasing incidence of type 1 and type 2 diabetes among Canadian children</article-title>
          <source>Can J Diabetes</source>
          <year>2022</year>
          <month>03</month>
          <volume>46</volume>
          <issue>2</issue>
          <fpage>189</fpage>
          <lpage>195</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jcjd.2021.08.006</pub-id>
          <pub-id pub-id-type="medline">35101343</pub-id>
          <pub-id pub-id-type="pii">S1499-2671(21)00226-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ortiz-Marrón</surname>
              <given-names>Honorato</given-names>
            </name>
            <name name-style="western">
              <surname>Del Pino Valero</surname>
              <given-names>Virginia</given-names>
            </name>
            <name name-style="western">
              <surname>Esteban-Vasallo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zorrilla Torras</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ordobás Gavín</surname>
              <given-names>María</given-names>
            </name>
          </person-group>
          <article-title>Evolution of the incidence of type 1 diabetes mellitus in the Community of Madrid, 1997-2016</article-title>
          <source>An Pediatr (Engl Ed)</source>
          <year>2021</year>
          <month>10</month>
          <volume>95</volume>
          <issue>4</issue>
          <fpage>253</fpage>
          <lpage>259</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2341-2879(21)00138-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.anpede.2020.08.011</pub-id>
          <pub-id pub-id-type="medline">34481795</pub-id>
          <pub-id pub-id-type="pii">S2341-2879(21)00138-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Purkiss</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Keegel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vally</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wollersheim</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Estimates of drug treated diabetes incidence and prevalence using Australian administrative pharmaceutical data</article-title>
          <source>Int J Popul Data Sci</source>
          <year>2021</year>
          <month>05</month>
          <day>10</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>1398</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34007898"/>
          </comment>
          <pub-id pub-id-type="doi">10.23889/ijpds.v6i1.1398</pub-id>
          <pub-id pub-id-type="medline">34007898</pub-id>
          <pub-id pub-id-type="pii">S2399490821013987</pub-id>
          <pub-id pub-id-type="pmcid">PMC8121372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abbas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ihle</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Köster</surname>
              <given-names>Ingrid</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Estimation of disease incidence in claims data dependent on the length of follow-up: a methodological approach</article-title>
          <source>Health Serv Res</source>
          <year>2012</year>
          <month>04</month>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>746</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21958217"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1475-6773.2011.01325.x</pub-id>
          <pub-id pub-id-type="medline">21958217</pub-id>
          <pub-id pub-id-type="pmcid">PMC3419886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ercia</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The effects of private health insurance on universal health coverage objectives in China: A systematic literature review</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>03</month>
          <day>19</day>
          <volume>17</volume>
          <issue>6</issue>
          <fpage>2049</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17062049"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17062049</pub-id>
          <pub-id pub-id-type="medline">32204527</pub-id>
          <pub-id pub-id-type="pii">ijerph17062049</pub-id>
          <pub-id pub-id-type="pmcid">PMC7142974</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Boerma</surname>
              <given-names>Jt</given-names>
            </name>
            <name name-style="western">
              <surname>Barber</surname>
              <given-names>Sl</given-names>
            </name>
          </person-group>
          <article-title>Trends in access to health services and financial protection in China between 2003 and 2011: a cross-sectional study</article-title>
          <source>Lancet</source>
          <year>2012</year>
          <month>03</month>
          <day>03</day>
          <volume>379</volume>
          <issue>9818</issue>
          <fpage>805</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(12)60278-5</pub-id>
          <pub-id pub-id-type="medline">22386034</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(12)60278-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Czwikla</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jobski</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Schink</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The impact of the lookback period and definition of confirmatory events on the identification of incident cancer cases in administrative data</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2017</year>
          <month>08</month>
          <day>14</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>122</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-017-0407-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-017-0407-4</pub-id>
          <pub-id pub-id-type="medline">28806932</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-017-0407-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC5556662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brameld</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Holman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hobbs</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Improved methods for estimating incidence from linked hospital morbidity data</article-title>
          <source>Int J Epidemiol</source>
          <year>2003</year>
          <month>08</month>
          <volume>32</volume>
          <issue>4</issue>
          <fpage>617</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1093/ije/dyg191</pub-id>
          <pub-id pub-id-type="medline">12913039</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shau</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Sex- and age-specific prevalence and incidence rates of sight-threatening diabetic retinopathy in Taiwan</article-title>
          <source>JAMA Ophthalmol</source>
          <year>2014</year>
          <month>08</month>
          <volume>132</volume>
          <issue>8</issue>
          <fpage>922</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaophthalmol.2014.859</pub-id>
          <pub-id pub-id-type="medline">24809869</pub-id>
          <pub-id pub-id-type="pii">1868371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Byrt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bishop</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carlin</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Bias, prevalence and kappa</article-title>
          <source>J Clin Epidemiol</source>
          <year>1993</year>
          <month>05</month>
          <volume>46</volume>
          <issue>5</issue>
          <fpage>423</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/0895-4356(93)90018-v</pub-id>
          <pub-id pub-id-type="medline">8501467</pub-id>
          <pub-id pub-id-type="pii">0895-4356(93)90018-V</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beaudet</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Courteau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sarret</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vanasse</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Improving the selection of true incident cases of low back pain by screening retrospective administrative data</article-title>
          <source>Eur J Pain</source>
          <year>2014</year>
          <month>08</month>
          <volume>18</volume>
          <issue>7</issue>
          <fpage>923</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.1002/j.1532-2149.2013.00437.x</pub-id>
          <pub-id pub-id-type="medline">24343901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vanasse</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Courteau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fleury</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Grégoire</surname>
              <given-names>Jean-Pierre</given-names>
            </name>
            <name name-style="western">
              <surname>Lesage</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moisan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Treatment prevalence and incidence of schizophrenia in Quebec using a population health services perspective: different algorithms, different estimates</article-title>
          <source>Soc Psychiatry Psychiatr Epidemiol</source>
          <year>2012</year>
          <month>04</month>
          <volume>47</volume>
          <issue>4</issue>
          <fpage>533</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1007/s00127-011-0371-y</pub-id>
          <pub-id pub-id-type="medline">21445625</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koo</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The incidence and prevalence of diabetes mellitus and related atherosclerotic complications in Korea: a National Health Insurance Database Study</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e110650</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0110650"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0110650</pub-id>
          <pub-id pub-id-type="medline">25329714</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-16213</pub-id>
          <pub-id pub-id-type="pmcid">PMC4199756</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenlund</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ekström</surname>
              <given-names>Nils</given-names>
            </name>
            <name name-style="western">
              <surname>Törnblom</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Wintzell</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Stark</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Titievsky</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Impact of variable look-back periods on the incidence rates of chronic diseases using real world data</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2020</year>
          <month>09</month>
          <volume>29</volume>
          <issue>9</issue>
          <fpage>1086</fpage>
          <lpage>1092</lpage>
          <pub-id pub-id-type="doi">10.1002/pds.5066</pub-id>
          <pub-id pub-id-type="medline">32648308</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blanchard</surname>
              <given-names>J F</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wajda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kendall</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Depew</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Incidence and prevalence of diabetes in Manitoba, 1986-1991</article-title>
          <source>Diabetes Care</source>
          <year>1996</year>
          <month>08</month>
          <volume>19</volume>
          <issue>8</issue>
          <fpage>807</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.2337/diacare.19.8.807</pub-id>
          <pub-id pub-id-type="medline">8842595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andes</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Gregg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rolka</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Diabetes prevalence and incidence among Medicare beneficiaries - United States, 2001-2015</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>68</volume>
          <issue>43</issue>
          <fpage>961</fpage>
          <lpage>966</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15585/mmwr.mm6843a2"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.mm6843a2</pub-id>
          <pub-id pub-id-type="medline">31671084</pub-id>
          <pub-id pub-id-type="pmcid">PMC6822811</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bratu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McLinden</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kooij</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Trigg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sereda</surname>
              <given-names>Paul</given-names>
            </name>
            <name name-style="western">
              <surname>Nanditha</surname>
              <given-names>Ni Gusti Ayu</given-names>
            </name>
            <name name-style="western">
              <surname>Lima</surname>
              <given-names>Viviane</given-names>
            </name>
            <name name-style="western">
              <surname>Guillemi</surname>
              <given-names>Silvia</given-names>
            </name>
            <name name-style="western">
              <surname>Salters</surname>
              <given-names>Kate</given-names>
            </name>
            <name name-style="western">
              <surname>Hogg</surname>
              <given-names>Robert</given-names>
            </name>
          </person-group>
          <article-title>Incidence of diabetes mellitus among people living with and without HIV in British Columbia, Canada between 2001 and 2013: a longitudinal population-based cohort study</article-title>
          <source>BMJ Open</source>
          <year>2021</year>
          <month>05</month>
          <day>11</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>e048744</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33980535"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2021-048744</pub-id>
          <pub-id pub-id-type="medline">33980535</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2021-048744</pub-id>
          <pub-id pub-id-type="pmcid">PMC8118079</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Blachley</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Musch</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Identification of persons with incident ocular diseases using health care claims databases</article-title>
          <source>Am J Ophthalmol</source>
          <year>2013</year>
          <month>12</month>
          <volume>156</volume>
          <issue>6</issue>
          <fpage>1169</fpage>
          <lpage>1175.e3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23972306"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ajo.2013.06.035</pub-id>
          <pub-id pub-id-type="medline">23972306</pub-id>
          <pub-id pub-id-type="pii">S0002-9394(13)00462-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC3836859</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schmedt</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Khil</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Riedel</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Incidence of multiple sclerosis in Germany: A cohort study applying different case definitions based on claims data</article-title>
          <source>Neuroepidemiology</source>
          <year>2017</year>
          <volume>49</volume>
          <issue>3-4</issue>
          <fpage>91</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1159/000481990</pub-id>
          <pub-id pub-id-type="medline">29136628</pub-id>
          <pub-id pub-id-type="pii">000481990</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Camplain</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kucharska-Newton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cuthbertson</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Alonso</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heiss</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Misclassification of incident hospitalized and outpatient heart failure in administrative claims data: the Atherosclerosis Risk in Communities (ARIC) study</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2017</year>
          <month>04</month>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>421</fpage>
          <lpage>428</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28120359"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.4162</pub-id>
          <pub-id pub-id-type="medline">28120359</pub-id>
          <pub-id pub-id-type="pmcid">PMC5380482</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benchimol</surname>
              <given-names>EI</given-names>
            </name>
            <name name-style="western">
              <surname>Guttmann</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mack</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>GC</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Gregor</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Forster</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Manuel</surname>
              <given-names>DG</given-names>
            </name>
          </person-group>
          <article-title>Validation of international algorithms to identify adults with inflammatory bowel disease in health administrative data from Ontario, Canada</article-title>
          <source>J Clin Epidemiol</source>
          <year>2014</year>
          <month>08</month>
          <volume>67</volume>
          <issue>8</issue>
          <fpage>887</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclinepi.2014.02.019</pub-id>
          <pub-id pub-id-type="medline">24774473</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(14)00083-3</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
