<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="brief-report" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JPH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Public Health Surveill</journal-id>
      <journal-title>JMIR Public Health and Surveillance</journal-title>
      <issn pub-type="epub">2369-2960</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v3i3e59</article-id>
    <article-id pub-id-type="pmid">28912117</article-id>
    <article-id pub-id-type="doi">10.2196/publichealth.7909</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Short Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Short Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Sample Size Calculations for Population Size Estimation Studies Using Multiplier Methods With Respondent-Driven Sampling Surveys</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Sabin</surname>
          <given-names>Keith</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Johnston</surname>
          <given-names>Lisa</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Hladik</surname>
          <given-names>Wolfgang</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes">
      <name name-style="western">
        <surname>Fearon</surname>
        <given-names>Elizabeth</given-names>
      </name>
      <degrees>MSc, PhD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Department of Social and Environmental Health Research</institution>
        <institution>London School of Hygiene and Tropical Medicine</institution>
        <addr-line>15-17 Tavistock Place</addr-line>
        <addr-line>London, WC1H 9SH</addr-line>
        <country>United Kingdom</country>
        <phone>44 20 7927 2877</phone>
        <email>Elizabeth.Fearon@lshtm.ac.uk</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5574-251X</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Chabata</surname>
          <given-names>Sungai T</given-names>
        </name>
        <degrees>MSc</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7629-1543</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Thompson</surname>
          <given-names>Jennifer A</given-names>
        </name>
        <degrees>MSc</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-3068-3952</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Cowan</surname>
          <given-names>Frances M</given-names>
        </name>
        <degrees>MBBS, MSc, MD, FRCPE</degrees>
        <xref rid="aff3" ref-type="aff">3</xref>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3087-4422</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib5">
        <name name-style="western">
          <surname>Hargreaves</surname>
          <given-names>James R</given-names>
        </name>
        <degrees>MSc, PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-3509-3572</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>Department of Social and Environmental Health Research</institution>
    <institution>London School of Hygiene and Tropical Medicine</institution>  
    <addr-line>London</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>Department of Infectious Disease Epidemiology</institution>
    <institution>London School of Hygiene and Tropical Medicine</institution>  
    <addr-line>London</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff3">
      <sup>3</sup>
      <institution>Centre for Sexual Health and HIV/AIDS Research</institution>
      <addr-line>Harare</addr-line>
      <country>Zimbabwe</country>
    </aff>
    <aff id="aff4">
    <sup>4</sup>
    <institution>Department of International Public Health</institution>
    <institution>Liverpool School of Tropical Medicine</institution>  
    <addr-line>Liverpool</addr-line>
    <country>United Kingdom</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Elizabeth Fearon 
      <email>Elizabeth.Fearon@lshtm.ac.uk</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Jul-Sep</season><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>14</day>
      <month>09</month>
      <year>2017</year>
    </pub-date>
    <volume>3</volume>
    <issue>3</issue>
    <elocation-id>e59</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>24</day>
        <month>4</month>
        <year>2017</year>
      </date>
      <date date-type="rev-request">
        <day>23</day>
        <month>6</month>
        <year>2017</year>
      </date>
      <date date-type="rev-recd">
        <day>4</day>
        <month>8</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>7</day>
        <month>8</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Elizabeth Fearon, Sungai T Chabata, Jennifer A Thompson, Frances M Cowan, James R Hargreaves. Originally published in JMIR Public Health and Surveillance (http://publichealth.jmir.org), 14.09.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Public Health and Surveillance, is properly cited. The complete bibliographic information, a link to the original publication on http://publichealth.jmir.org, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://publichealth.jmir.org/2017/3/e59/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>While guidance exists for obtaining population size estimates using multiplier methods with respondent-driven sampling surveys, we lack specific guidance for making sample size decisions.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>To guide the design of multiplier method population size estimation studies using respondent-driven sampling surveys to reduce the random error around the estimate obtained.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>The population size estimate is obtained by dividing the number of individuals receiving a service or the number of unique objects distributed (<italic>M</italic>) by the proportion of individuals in a representative survey who report receipt of the service or object (<italic>P</italic>). We have developed an approach to sample size calculation, interpreting methods to estimate the variance around estimates obtained using multiplier methods in conjunction with research into design effects and respondent-driven sampling. We describe an application to estimate the number of female sex workers in Harare, Zimbabwe.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>There is high variance in estimates. Random error around the size estimate reflects uncertainty from <italic>M</italic> and <italic>P</italic>, particularly when the estimate of <italic>P</italic> in the respondent-driven sampling survey is low. As expected, sample size requirements are higher when the design effect of the survey is assumed to be greater.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>We suggest a method for investigating the effects of sample size on the precision of a population size estimate obtained using multipler methods and respondent-driven sampling. Uncertainty in the size estimate is high, particularly when <italic>P</italic> is small, so balancing against other potential sources of bias, we advise researchers to consider longer service attendance reference periods and to distribute more unique objects, which is likely to result in a higher estimate of <italic>P</italic> in the respondent-driven sampling survey.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>population surveillance</kwd>
      <kwd>sample size</kwd>
      <kwd>sampling studies</kwd>
      <kwd>surveys and questionnaires</kwd>
      <kwd>research design</kwd>
      <kwd>data collection</kwd>
      <kwd>sex workers</kwd>
      <kwd>HIV</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Population size estimates (PSE) for those most at risk for human immunodeficiency virus infection are crucial to make epidemic projections, allocate funding, and monitor coverage of prevention and care programs [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. However, these populations are frequently stigmatized and criminalized and it is often not feasible or practical to conduct a census. One approach to obtaining a PSE is to use multiplier methods, including the service multiplier method (SMM) and the unique object multiplier method (UOM). The former uses 2 sources of data: (1) a count of program attendance or receipt of a service targeted to the population in question, and (2) a representative survey of the population in which uptake of service can be determined. The latter is the same, except the count is of the number of recognizable objects distributed to a population in advance of a survey. Obtaining a random sample of a population lacking a sampling frame is challenging, but there has been guidance published on adapting one of the methods commonly in use, respondent-driven sampling (RDS) [<xref ref-type="bibr" rid="ref3">3</xref>], for use with the service multiplier method [<xref ref-type="bibr" rid="ref4">4</xref>]. </p>
      <p>While there has been research into sample size requirements for RDS surveys [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>], we lack guidance applied to sample size requirements when used to obtain a PSE with a multiplier method. Here, we report our approach in the context of preparing a protocol to estimate the number of female sex workers (FSW) in Harare, Zimbabwe using the SMM implemented with an RDS survey.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>We briefly outline multiplier method size estimation, the approach to estimating uncertainty in the resulting population size estimates, and integrate this with advice on design effects and sample size requirements for RDS surveys.</p>
      </sec>
      <sec>
        <title>Multiplier Method Population Size Estimation</title>
        <p>Multiplier methods use 2 sources of data to estimate population size as described above: (1) a count of unique individuals from the target population receiving a service or unique objects distributed among this population, <italic>M</italic>, and (2) a representative estimate of the proportion of the target population in receipt of the service or object, <italic>P</italic>. The count is divided by the proportion as in Equation 1 (<xref ref-type="fig" rid="figure1">Figure 1</xref>) to obtain the population size estimate.</p>
        <p>Johnston et al. [<xref ref-type="bibr" rid="ref4">4</xref>] suggest using the Delta method to estimate the variance of the PSE, which combines variance in <italic>P</italic> and variance in <italic>M</italic>. We assume that <italic>M</italic>, as a count of target population individuals on a roster or unique objects distributed to the target population, follows a Poisson distribution for which the mean and variance are equal to µM [<xref ref-type="bibr" rid="ref8">8</xref>].  The variance of <italic>P</italic> depends on the sample size of the RDS survey.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Equations for estimating population size, study sample size, and variance of the population size estimate.</p>
          </caption>
          <graphic xlink:href="publichealth_v3i3e59_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Sample Size Calculations</title>
        <p>RDS is a structured, peer-referral recruitment method assuming a model for estimating each participant’s probability of inclusion; thus, allowing weighting of responses to be used to approximate a random sample [<xref ref-type="bibr" rid="ref9">9</xref>]. Existing guidance for estimating proportions from a RDS survey suggests that the sample size required for a simple random sample must be multiplied by a design effect (DEFF) to account for the RDS design [<xref ref-type="bibr" rid="ref10">10</xref>]. Empirical reviews of RDS surveys have found most DEFFs to lie between 2 and 4, though some studies have found higher DEFFs [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. The sample size for the RDS survey used to estimate <italic>P</italic> can be calculated as Equation 2 (<xref ref-type="fig" rid="figure1">Figure 1</xref>) given that <italic>n</italic> is sample size, <italic>µ</italic><sub>P</sub> is the estimate for the proportion we wish to estimate, and <italic>se(P)</italic> is the standard error of <italic>P</italic>. Recognizing that PSE are often required for small sites, we additionally suggest using a sample size <italic>n</italic><sub>adj</sub> that has been corrected for an estimated finite population as Equation 3 (<xref ref-type="fig" rid="figure1">Figure 1</xref>), where <italic>N</italic> is the estimated population size.</p>
        <p>Rearranging Equation 2, and using <italic>n</italic><sub>adj</sub> as obtained in Equation 3, <italic>se(P)</italic> as corrected for finite population size can be calculated as Equation 4 (<xref ref-type="fig" rid="figure1">Figure 1</xref>), and the effect on the variance of the PSE can be obtained by inserting <italic>se(P)</italic> into Equation 5 (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The 95% confidence interval (CI) around the PSE can then be obtained by taking the square root of <italic>var(M/P),</italic> multiplying by 1.96 (assuming an approximately normal distribution) and subtracting/adding to the PSE.</p>
        <p>We examined the relationship between sample size, <italic>P</italic>, and the width of the 95% CI obtained for a population size estimate of 15,000, fixing this estimate so that <italic>M</italic> varied with <italic>P</italic>.</p>
      </sec>
      <sec>
        <title>Application to Estimating the Number of Female Sex Workers in Harare</title>
        <p>To estimate the number of FSW in Harare, we planned a RDS survey of FSW aged 18 and older who had resided in the city for at least the previous 6 months. For service data, we planned to use Sisters with a Voice clinic attendance records. FSW attending this clinic, which provides sexual and reproductive health services for self-identified FSW, are given unique identification numbers and their visits recorded and dated (described further elsewhere [<xref ref-type="bibr" rid="ref12">12</xref>]). For <italic>M</italic>, we planned to record the number of unique women attending in the 6 months prior to the survey.</p>
        <p>To identify a reasonable estimated FSW population size for sample size calculation, we used previous estimates from a systematic review of FSW prevalence among 15- to 49-year-old women in sites from sub-Saharan Africa (.07%–4.3%) and multiplied them by the number of women of this age in Harare [<xref ref-type="bibr" rid="ref13">13</xref>]. The 2012 Zimbabwe census estimates that 30.2% of the population of Harare is female aged 15 to 49, and that the total population of Harare is 2,123,132 [<xref ref-type="bibr" rid="ref14">14</xref>], giving a FSW population size in Harare of 4488 to 27,572, with a plausible midrange estimate of 15,000, or 2.3%, of the adult female population.</p>
        <p>We examined the number of sex workers who visited the program for different reference periods up to April 23, 2015 to generate likely values for  <italic>M</italic> and  <italic>P</italic> given an assumed PSE of 15,000. We then examined the impact of reference period on sample size requirements assuming these values of  <italic>M</italic> and  <italic>P</italic>. Finally, we investigated the effect of DEFF on the width of the 95% CIs around the PSE for different sample sizes of the RDS survey. We developed a Web-based tool to implement the methods described here [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Relationships Between RDS Survey Sample Size, P, M, and Width of the 95% Confidence Intervals</title>
        <p>For all values of <italic>P</italic> and <italic>M,</italic> increasing the RDS survey sample size decreases the width of the CI around the PSE, <xref ref-type="fig" rid="figure2">Figure 2</xref>. The precision of the PSE also varies by the values of <italic>P</italic> and <italic>M</italic>, such that much larger sample sizes would be required to estimate the PSE with the same level of precision if <italic>P</italic> is small rather than large (and correspondingly, <italic>M</italic> is small rather than large).</p>
        <p>In <xref ref-type="fig" rid="figure2">Figure 2</xref>, values of <italic>M</italic> are varied with <italic>P</italic> so that <italic>M</italic> / <italic>P</italic> is always equal to 15,000. For instance if <italic>P</italic>=.05, <italic>M</italic>=750, or if <italic>P</italic>=.4, <italic>M</italic>=6000.</p>
       


      </sec>
      <sec>
        <title>Application to Planning a Population Size Estimation Study</title>
        <p>For our Harare example, we were able to review earlier service attendance data to see how the value of <italic>M</italic> might depend on the reference period chosen. The value of <italic>M</italic> in turn affects the sample size required via the impact on <italic>P</italic>, as shown in <xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="fig" rid="figure3">Figure 3</xref>, which assume a population of 15,000 FSW in Harare. Depending on whether we chose a period of 1 or 24 months, we might be estimating a proportion of .006 or a proportion of .148. For a given sample size, the width of the 95% CI will increase if the reference period is shorter and <italic>P</italic> is smaller. Higher DEFFs increase the uncertainty around the PSE, <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p>
        <p>We used previous service attendance data to observe how <italic>M</italic> varied by reference period, and therefore to predict how our estimate of <italic>P</italic>, the proportion of women attending, might vary by the reference period we chose, see <xref ref-type="table" rid="table1">Table 1</xref>. <xref ref-type="fig" rid="figure3">Figure 3</xref> shows the relationship between these values of <italic>P</italic> with the width of the 95% CI’s around the PSE for different sample sizes.</p>
        <p>Based on changes in the width of the estimated 95% CIs with increasing sample size (<xref ref-type="fig" rid="figure3">Figure 3</xref>) and on choosing a reference period that would both reduce the likelihood of recall bias while preventing <italic>P</italic> from being too low, we chose a sample size of 1500 FSW for the RDS survey and a reference period for Sisters service attendance of 6 months, for which we estimated <italic>P</italic> would be approximately .06.</p>
        
 <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Sample size and width of 95% confidence interval around a fixed population size estimate of 15,000 for different values of <italic>P</italic> and <italic>M</italic>, assuming a design effect of 3.</p>
          </caption>
          <graphic xlink:href="publichealth_v3i3e59_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>



<table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Number of female sex workers attending the Sisters program and effect on <italic>P</italic> given the total female sex worker population = 15,000 in Harare.</p>
          </caption>
          <table width="840" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="260"/>
            <col width="290"/>
            <col width="290"/>
            <thead>
              <tr valign="top">
                <td>Reference period to April 23, 2015</td>
                <td>Number of unique female sex workers attending, M</td>
                <td>Estimated <italic>P</italic>, assuming population = 15,000</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td><bold>1 month</bold></td>
                <td>85</td>
                <td>.006</td>
              </tr>
              <tr valign="top">
                <td><bold>3 months</bold></td>
                <td>560</td>
                <td>.037</td>
              </tr>
              <tr valign="top">
                <td><bold>6 months</bold></td>
                <td>952</td>
                <td>.063</td>
              </tr>
              <tr valign="top">
                <td><bold>12 months</bold></td>
                <td>1542</td>
                <td>.103</td>
              </tr>
              <tr valign="top">
                <td><bold>24 months</bold></td>
                <td>2227</td>
                <td>.148</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Effect of reference period (variations in <italic>P</italic>), width of the 95% confidence interval around the population size estimate and sample size required for estimating the number of female sex workers in Harare.</p>
          </caption>
          <graphic xlink:href="publichealth_v3i3e59_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Sample size and width of 95% confidence intervals around a population size estimate of 15,000 female sex workers in Harare, for assumed reference period of 6 months and design effects (DEFF) of 2, 3, and 4.</p>
          </caption>
          <graphic xlink:href="publichealth_v3i3e59_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Summary and Discussion of Findings</title>
        <p>We have applied current guidance on RDS and multiplier methods to propose an approach to planning population size estimation studies and determining sample size. We have given an example using the SMM, similar principles of which can be applied to the UOM.</p>
        <p>Even for large sample sizes, 95% CIs around the PSE are wide. The uncertainty around the PSE is more sensitive to the uncertainty in <italic>P</italic> than in <italic>M</italic>, which is evident from the formula for <italic>var(M/P)</italic>. Researchers cannot choose a value of <italic>P</italic>, but they can encourage it to be higher by encouraging <italic>M</italic> to be higher. Concerned only with random error, it would improve the precision of the PSE to choose a longer reference period, and thus likely obtain a larger <italic>P</italic> in the case of the SMM, or to distribute a greater number of unique objects for the UOM. However, for the SMM this approach needs to be balanced against the potential for recall bias on estimation of <italic>P</italic>. It is also possible that the relationship between <italic>M</italic> and the reference period will differ across service types and according to whether individuals visit frequently or sporadically, and that bias in <italic>M</italic> might vary by reference period. If there are errors in unique identification of individuals in the service data, a longer reference period could lead to a higher likelihood of duplicate identification numbers, which would bias the PSE. For the UOM, care is needed to ensure that more objects distributed did not increase the likelihood of dependence between methods of distribution and RDS survey recruitment, a key source of potential bias.</p>
        <p>We used DEFFs of 2 to 4 in our sample size calculations, but it is possible that a higher value would be more appropriate. Previous research has found that high levels of homophily (similarity) between recruiters and recruitees in RDS surveys is associated with higher DEFFs [<xref ref-type="bibr" rid="ref7">7</xref>]. In SMM studies, the RDS survey is intended to measure program attendance, a characteristic that is likely to exhibit high homophily as it is a route by which participants might know and recruit each other. High homophily is also likely when the same social networks are used to distribute unique objects and to later recruit individuals to a RDS survey. Higher DEFFs might therefore be required, though in a previous population size estimation study of 9 communities in Zimbabwe, we found evidence of high homophily by program attendance for some sites but not all [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <p>RDS surveys must have sufficient recruitment waves in order to reach stable estimates. There should also be sufficient numbers of seed participants to reflect diversity of the target population [<xref ref-type="bibr" rid="ref16">16</xref>], concerns that need to be considered alongside the total sample size [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
      </sec>
      <sec>
        <title>Recommendations</title>
        <p>This short paper considers random error around size estimates and does not discuss a consideration of bias resulting from unmet assumptions of both the multiplier and RDS methods, which we consider elsewhere [<xref ref-type="bibr" rid="ref8">8</xref>]. We agree with advice that researchers should use more than one multiplier and more than one method of estimating population size [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. However, justification for sample size is often not given. Based on our findings, we strongly recommend conducting sample size calculations for estimating population size and considering the relationship between reference period or number of objects distributed and <italic>P</italic> for potential impact on uncertainty.</p>
      </sec>
    </sec>
  </body>
  <back>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CI</term>
          <def>
            <p>confidence interval</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DEFF</term>
          <def>
            <p>design effect</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FSW</term>
          <def>
            <p>female sex workers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">PSE</term>
          <def>
            <p>population size estimates</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RDS</term>
          <def>
            <p>respondent-driven sampling</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">SMM</term>
          <def>
            <p>service multiplier method</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">UOM</term>
          <def>
            <p>unique object multiplier method</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Measurement and Surveillance of Human Immunodeficiency Virus Epidemics Consortium (MeSH), which is funded by the Bill &#38; Melinda Gates Foundation (Funder ID OPP1120138). The Funder has not been involved in manuscript review or approval.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Holland</surname>
            <given-names>CE</given-names>
          </name>
          <name name-style="western">
            <surname>Kouanda</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Lougué</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Pitche</surname>
            <given-names>VP</given-names>
          </name>
          <name name-style="western">
            <surname>Schwartz</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Anato</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ouedraogo</surname>
            <given-names>HG</given-names>
          </name>
          <name name-style="western">
            <surname>Tchalla</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Yah</surname>
            <given-names>CS</given-names>
          </name>
          <name name-style="western">
            <surname>Kapesa</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ketende</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Beyrer</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Baral</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Using population-size estimation and cross-sectional survey methods to evaluate HIV service coverage among key populations in Burkina Faso and Togo</article-title>
        <source>Public Health Rep</source>  
        <year>2016</year>  
        <volume>131</volume>  
        <fpage>773</fpage>  
        <lpage>782</lpage>  
        <pub-id pub-id-type="doi">10.1177/0033354916677237</pub-id>
        <pub-id pub-id-type="medline">28123223</pub-id>
        <pub-id pub-id-type="pii">10.1177_0033354916677237</pub-id>
        <pub-id pub-id-type="pmcid">PMC5230836</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>UNAIDS/WHO Working Group on Global HIV/AIDS and STI Surveillance</collab>
        </person-group>
        <source>Guidelines on estimating the size of populations most at risk to HIV</source>  
        <year>2010</year>  
        <access-date>2017-08-21</access-date>
        <publisher-name>World Health Organization</publisher-name>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://apps.who.int/iris/bitstream/10665/44347/1/9789241599580_eng.pdf">http://apps.who.int/iris/bitstream/10665/44347/1/9789241599580_eng.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6ssi9wajd"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>World Health Organization</collab>
          <collab>UNAIDS</collab>
        </person-group>
        <source>Introduction to HIV/AIDS and sexually transmitted infection surveillance</source>  
        <year>2013</year>  
        <access-date>2017-08-21</access-date>
        <publisher-loc>Geneva</publisher-loc>
        <publisher-name>World Health Organization</publisher-name>
        <comment>Module 4 Introduction to respondent-driven sampling 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://applications.emro.who.int/dsaf/EMRPUB_2013_EN_1539.pdf">http://applications.emro.who.int/dsaf/EMRPUB_2013_EN_1539.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6ssjQ0yyO"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Johnston</surname>
            <given-names>LG</given-names>
          </name>
          <name name-style="western">
            <surname>Prybylski</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Raymond</surname>
            <given-names>HF</given-names>
          </name>
          <name name-style="western">
            <surname>Mirzazadeh</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Manopaiboon</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>McFarland</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Incorporating the service multiplier method in respondent-driven sampling surveys to estimate the size of hidden and hard-to-reach populations: case studies from around the world</article-title>
        <source>Sex Transm Dis</source>  
        <year>2013</year>  
        <volume>40</volume>  
        <fpage>304</fpage>  
        <lpage>310</lpage>  
        <pub-id pub-id-type="doi">10.1097/OLQ.0b013e31827fd650</pub-id>
        <pub-id pub-id-type="medline">23486495</pub-id>
        <pub-id pub-id-type="pii">00007435-201304000-00010</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wejnert</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>An empirical test of respondent-driven sampling: point estimates, variance, degree measures, and out-of-equilibrium data</article-title>
        <source>Sociol Methodol</source>  
        <year>2009</year>  
        <volume>39</volume>  
        <fpage>73</fpage>  
        <lpage>116</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20161130"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/j.1467-9531.2009.01216.x</pub-id>
        <pub-id pub-id-type="medline">20161130</pub-id>
        <pub-id pub-id-type="pmcid">PMC2743108</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Johnston</surname>
            <given-names>LG</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Silva-Santisteban</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Raymond</surname>
            <given-names>HF</given-names>
          </name>
        </person-group>
        <article-title>An empirical examination of respondent driven sampling design effects among HIV risk groups from studies conducted around the world</article-title>
        <source>AIDS Behav</source>  
        <year>2013</year>  
        <volume>17</volume>  
        <fpage>2202</fpage>  
        <lpage>2210</lpage>  
        <pub-id pub-id-type="doi">10.1007/s10461-012-0394-8</pub-id>
        <pub-id pub-id-type="medline">23297082</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wejnert</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Pham</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Krishna</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Le</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>DiNenno</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Estimating design effect and calculating sample size for respondent-driven sampling studies of injection drug users in the United States</article-title>
        <source>AIDS Behav</source>  
        <year>2012</year>  
        <volume>16</volume>  
        <fpage>797</fpage>  
        <lpage>806</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22350828"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s10461-012-0147-8</pub-id>
        <pub-id pub-id-type="medline">22350828</pub-id>
        <pub-id pub-id-type="pmcid">PMC3382647</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chabata</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>Estimating the size of the female sex worker population in urban and rural communities in Zimbabwe: Project Report for Masters of Science in Medical Statistics [master's thesis]</source>  
        <year>2015</year>  
        <publisher-loc>London, UK</publisher-loc>
        <publisher-name>London School of Hygiene and Tropical Medicine</publisher-name></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Heckathorn</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Respondent-driven sampling: a new approach to the study of hidden populations</article-title>
        <source>Social Problems</source>  
        <year>1997</year>  
        <volume>44</volume>  
        <fpage>174</fpage>  
        <lpage>199</lpage>  
        <pub-id pub-id-type="doi">10.2307/3096941</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salganik</surname>
            <given-names>MJ</given-names>
          </name>
        </person-group>
        <article-title>Variance estimation, design effects, and sample size calculations for respondent-driven sampling</article-title>
        <source>J Urban Health</source>  
        <year>2006</year>  
        <volume>83</volume>  
        <issue>6 Suppl</issue>  
        <fpage>i98</fpage>  
        <lpage>i112</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16937083"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s11524-006-9106-x</pub-id>
        <pub-id pub-id-type="medline">16937083</pub-id>
        <pub-id pub-id-type="pmcid">PMC1705515</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Goel</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Salganik</surname>
            <given-names>MJ</given-names>
          </name>
        </person-group>
        <article-title>Assessing respondent-driven sampling</article-title>
        <source>Proc Natl Acad Sci U S A</source>  
        <year>2010</year>  
        <volume>107</volume>  
        <fpage>6743</fpage>  
        <lpage>6747</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=20351258"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1073/pnas.1000261107</pub-id>
        <pub-id pub-id-type="medline">20351258</pub-id>
        <pub-id pub-id-type="pii">1000261107</pub-id>
        <pub-id pub-id-type="pmcid">PMC2872407</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hargreaves</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Mtetwa</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Davey</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Dirawo</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chidiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Benedikt</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Naperiela</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Wong-Gruenwald</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hanisch</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Magure</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Mugurungi</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Cowan</surname>
            <given-names>FM</given-names>
          </name>
        </person-group>
        <article-title>Cohort analysis of programme data to estimate HIV incidence and uptake of HIV-related services among female sex workers in Zimbabwe, 2009-14</article-title>
        <source>J Acquir Immune Defic Syndr</source>  
        <year>2015</year>  
        <pub-id pub-id-type="doi">10.1097/QAI.0000000000000920</pub-id>
        <pub-id pub-id-type="medline">26674371</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Vandepitte</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lyerla</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Dallabetta</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Crabbé</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Alary</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Buvé</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Estimates of the number of female sex workers in different regions of the world</article-title>
        <source>Sex Transm Infect</source>  
        <year>2006</year>  
        <volume>82 Suppl 3</volume>  
        <fpage>18</fpage>  
        <lpage>25</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16735288"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/sti.2006.020081</pub-id>
        <pub-id pub-id-type="medline">16735288</pub-id>
        <pub-id pub-id-type="pii">82/suppl_3/iii18</pub-id>
        <pub-id pub-id-type="pmcid">PMC2576726</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Zimbabwe National Statistics Agency</collab>
        </person-group>
        <source>Zimbabwe Population Census 2012</source>  
        <year>2012</year>  
        <access-date>2017-08-21</access-date>
        <publisher-loc>Harare</publisher-loc>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.zimstat.co.zw/sites/default/files/img/National_Report.pdf">http://www.zimstat.co.zw/sites/default/files/img/National_Report.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6sskC0EA2"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fearon</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <source>Planning a multiplier method population size estimation study with RDS: a tool for calculating width of the 95% confidence intervals for a given set of inputs 2017</source>  
        <year>2017</year>  
        <access-date>2017-08-30</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://fearone.shinyapps.io/rds_ss_shiny/">https://fearone.shinyapps.io/rds_ss_shiny/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6t6cmeWJO"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Johnston</surname>
            <given-names>LG</given-names>
          </name>
          <name name-style="western">
            <surname>Whitehead</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Simic-Lawson</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kendall</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Formative research to optimize respondent-driven sampling surveys among hard-to-reach populations in HIV behavioral and biological surveillance: lessons learned from four case studies</article-title>
        <source>AIDS Care</source>  
        <year>2010</year>  
        <volume>22</volume>  
        <fpage>784</fpage>  
        <lpage>792</lpage>  
        <pub-id pub-id-type="doi">10.1080/09540120903373557</pub-id>
        <pub-id pub-id-type="medline">20467937</pub-id>
        <pub-id pub-id-type="pii">922145866</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gile</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Handcock</surname>
            <given-names>MS</given-names>
          </name>
        </person-group>
        <article-title>Respondent-driven sampling: an assessment of current methodology</article-title>
        <source>Sociol Methodol</source>  
        <year>2010</year>  
        <volume>40</volume>  
        <fpage>285</fpage>  
        <lpage>327</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22969167"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/j.1467-9531.2010.01223.x</pub-id>
        <pub-id pub-id-type="medline">22969167</pub-id>
        <pub-id pub-id-type="pmcid">PMC3437336</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Abdul-Quader</surname>
            <given-names>AS</given-names>
          </name>
          <name name-style="western">
            <surname>Baughman</surname>
            <given-names>AL</given-names>
          </name>
          <name name-style="western">
            <surname>Hladik</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Estimating the size of key populations: current status and future possibilities</article-title>
        <source>Curr Opin HIV AIDS</source>  
        <year>2014</year>  
        <volume>9</volume>  
        <fpage>107</fpage>  
        <lpage>114</lpage>  
        <pub-id pub-id-type="doi">10.1097/COH.0000000000000041</pub-id>
        <pub-id pub-id-type="medline">24393694</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wesson</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Reingold</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>McFarland</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Theoretical and empirical comparisons of methods to estimate the size of hard-to-reach populations: a systematic review</article-title>
        <source>AIDS Behav</source>  
        <year>2017</year>  
        <pub-id pub-id-type="doi">10.1007/s10461-017-1678-9</pub-id>
        <pub-id pub-id-type="medline">28078496</pub-id>
        <pub-id pub-id-type="pii">10.1007/s10461-017-1678-9</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
