<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PONE-D-18-06181</article-id>
<article-id pub-id-type="doi">10.1371/journal.pone.0208795</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Social sciences</subject><subj-group><subject>Economics</subject><subj-group><subject>Economic models</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Body fluids</subject><subj-group><subject>Blood</subject><subj-group><subject>Blood counts</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Anatomy</subject><subj-group><subject>Body fluids</subject><subj-group><subject>Blood</subject><subj-group><subject>Blood counts</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Body fluids</subject><subj-group><subject>Blood</subject><subj-group><subject>Blood counts</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Body fluids</subject><subj-group><subject>Blood</subject><subj-group><subject>Blood counts</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>People and places</subject><subj-group><subject>Population groupings</subject><subj-group><subject>Age groups</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Clinical trials</subject><subj-group><subject>Randomized controlled trials</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Pharmacology</subject><subj-group><subject>Drug research and development</subject><subj-group><subject>Clinical trials</subject><subj-group><subject>Randomized controlled trials</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Clinical trials</subject><subj-group><subject>Randomized controlled trials</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Arithmetic</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Microbiology</subject><subj-group><subject>Medical microbiology</subject><subj-group><subject>Microbial pathogens</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Immunodeficiency viruses</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Pathology and laboratory medicine</subject><subj-group><subject>Pathogens</subject><subj-group><subject>Microbial pathogens</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Immunodeficiency viruses</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Organisms</subject><subj-group><subject>Viruses</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Immunodeficiency viruses</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Organisms</subject><subj-group><subject>Viruses</subject><subj-group><subject>Immunodeficiency viruses</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Organisms</subject><subj-group><subject>Viruses</subject><subj-group><subject>RNA viruses</subject><subj-group><subject>Retroviruses</subject><subj-group><subject>Lentivirus</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Microbiology</subject><subj-group><subject>Medical microbiology</subject><subj-group><subject>Microbial pathogens</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Retroviruses</subject><subj-group><subject>Lentivirus</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Pathology and laboratory medicine</subject><subj-group><subject>Pathogens</subject><subj-group><subject>Microbial pathogens</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Retroviruses</subject><subj-group><subject>Lentivirus</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Organisms</subject><subj-group><subject>Viruses</subject><subj-group><subject>Viral pathogens</subject><subj-group><subject>Retroviruses</subject><subj-group><subject>Lentivirus</subject><subj-group><subject>HIV</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Infectious diseases</subject><subj-group><subject>Viral diseases</subject><subj-group><subject>AIDS</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Diagnostic medicine</subject><subj-group><subject>HIV diagnosis and management</subject></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>Sensitivity analyses for effect modifiers not observed in the target population when generalizing treatment effects from a randomized controlled trial: Assumptions, models, effect scales, data scenarios, and implementation details</article-title>
<alt-title alt-title-type="running-head">Sensitivity to unobserved effect modifiers in generalizability</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<name name-style="western">
<surname>Nguyen</surname> <given-names>Trang Quynh</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-2522-6623</contrib-id>
<name name-style="western">
<surname>Ackerman</surname> <given-names>Benjamin</given-names></name>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Schmid</surname> <given-names>Ian</given-names></name>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Cole</surname> <given-names>Stephen R.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Stuart</surname> <given-names>Elizabeth A.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Department of Mental Health, Johns Hopkins Bloomberg School of Public Health, Baltimore, MD, United States of America</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Department of Biostatistics, Johns Hopkins Bloomberg School of Public Health, Baltimore, MD, United States of America</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>Department of Epidemiology, Gillings School of Global Public Health, University of North Carolina, Chapel Hill, NC, United States of America</addr-line>
</aff>
<aff id="aff004">
<label>4</label>
<addr-line>Department of Health Policy and Management, Johns Hopkins Bloomberg School of Public Health, Baltimore, MD, United States of America</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Mitra</surname> <given-names>Nandita</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>University of Pennsylvania, UNITED STATES</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">tnguye28@jhu.edu</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<year>2018</year>
</pub-date>
<pub-date pub-type="epub">
<day>11</day>
<month>12</month>
<year>2018</year>
</pub-date>
<volume>13</volume>
<issue>12</issue>
<elocation-id>e0208795</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>2</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>11</month>
<year>2018</year>
</date>
</history>
<permissions>
<copyright-year>2018</copyright-year>
<copyright-holder>Nguyen et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0208795"/>
<abstract>
<sec id="sec001">
<title>Background</title>
<p>Randomized controlled trials are often used to inform policy and practice for broad populations. The average treatment effect (ATE) for a target population, however, may be different from the ATE observed in a trial if there are effect modifiers whose distribution in the target population is different that from that in the trial. Methods exist to use trial data to estimate the target population ATE, provided the distributions of treatment effect modifiers are observed in both the trial and target population—an assumption that may not hold in practice.</p>
</sec>
<sec id="sec002">
<title>Methods</title>
<p>The proposed sensitivity analyses address the situation where a treatment effect modifier is observed in the trial but not the target population. These methods are based on an outcome model or the combination of such a model and weighting adjustment for observed differences between the trial sample and target population. They accommodate several types of outcome models: linear models (including single time outcome and pre- and post-treatment outcomes) for additive effects, and models with log or logit link for multiplicative effects. We clarify the methods’ assumptions and provide detailed implementation instructions.</p>
</sec>
<sec id="sec003">
<title>Illustration</title>
<p>We illustrate the methods using an example generalizing the effects of an HIV treatment regimen from a randomized trial to a relevant target population.</p>
</sec>
<sec id="sec004">
<title>Conclusion</title>
<p>These methods allow researchers and decision-makers to have more appropriate confidence when drawing conclusions about target population effects.</p>
</sec>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100006093</institution-id>
<institution>Patient-Centered Outcomes Research Institute</institution>
</institution-wrap>
</funding-source>
<award-id>ME-150227794</award-id>
<principal-award-recipient>
<name name-style="western">
<surname>Stuart</surname> <given-names>Elizabeth A.</given-names></name>
</principal-award-recipient>
</award-group>
<award-group id="award002">
<funding-source>
<institution>National Institute on Drug Abuse (US)</institution>
</funding-source>
<award-id>R01-DA036520</award-id>
</award-group>
<funding-statement>This work was supported in part by NSF grant DRL-1335843 (co-PIs E. A. Stuart and R. B. Olsen), PCORI grant ME-150227794 (co-PIs I. Dahabreh and E. A. Stuart), NIDA grant R01-DA036520 (PI R. Mojtabai), and NIAID grant R01AI100654 (PI S. R. Cole). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="3"/>
<table-count count="9"/>
<page-count count="17"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All relevant data are within the manuscript and its Supporting Information files.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec005" sec-type="intro">
<title>Introduction</title>
<p>Randomized controlled trials (<italic>trials</italic>) are often used to inform policy and practice for broad populations. A well designed and implemented trial allows consistent estimation of the average treatment/intervention effect (ATE) for the trial sample. We refer to this as the <italic>Study-specific ATE</italic> (SATE). If the question is whether that treatment should be used for people in a certain population (<italic>target population</italic>), then of interest is the <italic>Target population ATE</italic> (TATE). Since trial samples are often not representative of target populations, SATE may not be a good estimate of TATE. SATE departs from TATE if the trial sample differs from the target population with respect to the distribution of treatment effect modifiers.</p>
<p>Methods exist to use trial data to estimate TATE, e.g., [<xref ref-type="bibr" rid="pone.0208795.ref001">1</xref>–<xref ref-type="bibr" rid="pone.0208795.ref003">3</xref>], assuming treatment effect variation is explained by pre-treatment variables that are observed in both the trial and target population. Often, however, the variables observed for the target population are limited compared to those measured in the trial [<xref ref-type="bibr" rid="pone.0208795.ref004">4</xref>, <xref ref-type="bibr" rid="pone.0208795.ref005">5</xref>]. This paper presents simple methods to assess the sensitivity of TATE estimates to effect modifiers observed in the trial but not in the target population. The paper starts from the simple case of additive effects based on an uncomplicated linear model (previously addressed in [<xref ref-type="bibr" rid="pone.0208795.ref006">6</xref>]) and extends to cases with more complex models and multiplicative effects. We clarify the assumptions of these methods for a general audience and provide detailed implementation instructions.</p>
<p>We illustrate the sensitivity analyses using an example based on the AIDS Clinical Trial Group (ACTG) 320 Study [<xref ref-type="bibr" rid="pone.0208795.ref007">7</xref>]. This trial randomized HIV-infected adults to two antiretroviral regimens: (i) two nucleoside reverse-transcriptase inhibitors (AZT or d4T and 3TC) plus a protease inhibitor (Indinavir), and (ii) AZT/d4T and 3TC only—referred to as new and old treatment, respectively. The trial found that relative to the old treatment, the new treatment lowered the hazard of AIDS and/or death. Cole &amp; Stuart [<xref ref-type="bibr" rid="pone.0208795.ref001">1</xref>] generalized this effect to the population of people diagnosed with HIV in the US in 2006, using a set of covariates observed in both the trial and target population. Our example is based on this trial-population pair. We consider a different outcome, CD4 count (number of T-CD4 cells per ml blood), which is an important indicator of immunity status. We use the same target population dataset that Cole &amp; Stuart created for [<xref ref-type="bibr" rid="pone.0208795.ref001">1</xref>] based on the CDC-estimated joint distribution of demographic characteristics in this population [<xref ref-type="bibr" rid="pone.0208795.ref008">8</xref>]. As the trial data are not for open access, for this illustration, we use a synthetic trial dataset created to mimic the distributions in the real trial data.</p>
</sec>
<sec id="sec006">
<title>Methods for the simplest case: Additive effects on potential outcome based on a linear causal model</title>
<p>For this case, the basic mathematical results of the methods and one of their key assumptions were developed in [<xref ref-type="bibr" rid="pone.0208795.ref006">6</xref>]. The current paper elaborates on the full set of assumptions required by these methods, and pays close attention to details relevant to their effective use, such as different data scenarios and corresponding implementation instructions, including variation in weighting procedures for the method that involves weighting.</p>
<sec id="sec007">
<title>Trial sample, target population data, effect definitions</title>
<p>Consider a trial evaluating the effect of treatment <italic>A</italic> on outcome <italic>Y</italic>. Let <italic>S</italic> = 1 denote trial participation, <italic>P</italic> = 1 denote membership in the target population. In <xref ref-type="fig" rid="pone.0208795.g001">Fig 1</xref>, the trial sample is drawn from the target population (i.e., individuals <italic>i</italic> with <italic>S</italic><sub><italic>i</italic></sub> = 1 also have <italic>P</italic><sub><italic>i</italic></sub> = 1); and the purpose is to generalize trial results back to the target population. If the trial sample is drawn from a different population (i.e., <italic>S</italic> = 1 is outside of <italic>P</italic> = 1), the problem is to transport [<xref ref-type="bibr" rid="pone.0208795.ref009">9</xref>] results to the target population.</p>
<fig id="pone.0208795.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Several data source scenarios for generalization from the trial (<italic>S</italic> = 1) to the target population (<italic>P</italic> = 1).</title>
<p>(a) the trial sample and a full population dataset; (b) the trial sample and a dataset (<italic>S</italic> = 2) that is representative of the population; (c) the trial sample and some summary statistics about the population.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.g001" xlink:type="simple"/>
</fig>
<p>We present the methods using a binary treatment. Let <italic>Y</italic><sub><italic>i</italic></sub>(<italic>a</italic>) denote individual <italic>i</italic>’s potential outcome [<xref ref-type="bibr" rid="pone.0208795.ref010">10</xref>] if treatment were set to <italic>a</italic>, with <italic>a</italic> = 1, 0 (treatment or control). Treatment effect for individual <italic>i</italic> is defined on the additive scale as <italic>Y</italic><sub><italic>i</italic></sub>(1) − <italic>Y</italic><sub><italic>i</italic></sub>(0), the difference between potential outcomes under treatment and under control.</p>
<p>SATE is defined as the average treatment effect in the trial sample, E[<italic>Y</italic>(1) − <italic>Y</italic>(0)|<italic>S</italic> = 1]. Due to randomization, SATE is unbiasedly estimated, for example, by the difference in mean outcome between the trial’s treatment arms. Of interest, however, is TATE, defined as E[<italic>Y</italic>(1) − <italic>Y</italic>(0)|<italic>P</italic> = 1], the average treatment effect in the target population.</p>
<p>The sensitivity analyses require data on the distribution of pre-treatment covariates in the target population. Such data may come from a full population (<italic>P</italic> = 1) dataset, a representative (<italic>S</italic> = 2) sub-sample, or population summary statistics (see <xref ref-type="fig" rid="pone.0208795.g001">Fig 1</xref>).</p>
</sec>
<sec id="sec008">
<title>Assumptions</title>
<p>Several assumptions are required. The first assumption is that the trial has internal validity (A1), which itself consists of several conditions listed in <xref ref-type="table" rid="pone.0208795.t001">Table 1</xref>. We will not discuss interval validity further, but this is a key assumption. On top of this, we need a set of assumptions commonly used in generalization [<xref ref-type="bibr" rid="pone.0208795.ref001">1</xref>–<xref ref-type="bibr" rid="pone.0208795.ref003">3</xref>]: across-setting treatment variance irrelevance (A2), trial coverage of target population ranges of the effect modifiers (A3), conditional ignorability for treatment effects (A4), and consistent measurement and no measurement error (A5)—see detailed explanations of and practical comments on these assumptions in <xref ref-type="table" rid="pone.0208795.t001">Table 1</xref>.</p>
<table-wrap id="pone.0208795.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t001</object-id>
<label>Table 1</label>
<caption>
<title>Key assumptions.</title>
</caption>
<alternatives>
<graphic id="pone.0208795.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left" colspan="2">Assumption</th>
<th align="left">Details</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">A1.</td>
<td align="left">Internal validity of the trial</td>
<td align="left">We make all the assumptions required for the trial’s internal validity, e.g., conditional ignorability of treatment assignment, positivity, treatment variance irrelevance, no interference, etc.</td>
</tr>
<tr>
<td align="left">A2.</td>
<td align="left">Across-setting treatment variation irrelevance</td>
<td align="left">When a treatment is applied to the target population, it is administered in settings that are likely different from the trial setting. The assumption is that the differences in the treatment that result do not change its effect.<break/>This assumption is non-trivial in some settings and should be examined explicitly in generalization practice. In this paper, we simply make the assumption; its plausibility is not the problem we currently aim to discuss.</td>
</tr>
<tr>
<td align="left">A3.</td>
<td align="left">Treatment effect modifiers coverage</td>
<td align="left">Treatment effects depend on a set of pre-treatment variables observed in the trial (denoted <italic>Z</italic> if observed and <italic>V</italic> if not observed in the target population), and the range of these (observed and unobserved) effect modifiers in the target population is covered by their range in the trial.<break/>The rationale is that if there are members of the target population with effect modifier values outside the range observed in the trial, we cannot use trial data to learn about their treatment effects. This assumption, which is similar to positivity, is formally Pr(<italic>S</italic> = 1|<italic>Z</italic> = <italic>z</italic>, <italic>V</italic> = <italic>v</italic>) &gt; 0 if Pr(<italic>Z</italic> = <italic>z</italic>, <italic>V</italic> = <italic>v</italic>|<italic>P</italic> = 1) &gt; 0 where Pr[⋅] is the probability function [<xref ref-type="bibr" rid="pone.0208795.ref017">17</xref>]. This assumption can be checked for <italic>Z</italic> variables but not for <italic>V</italic>.</td>
</tr>
<tr>
<td align="left">A4.</td>
<td align="left">Conditional sample ignorability for treatment effects [<xref ref-type="bibr" rid="pone.0208795.ref003">3</xref>]</td>
<td align="left">For an individual (in the trial or the target population) with effect modifiers within the target population range, “sample membership” (i.e., whether the individual is in the trial or in the target population) does not carry any information about the treatment effect once we condition on the effect modifiers. For additive effects, this is formally [<italic>Y</italic>(1) − <italic>Y</italic>(0)] ⫫ {<italic>S</italic>, <italic>P</italic>}∣<italic>Z</italic>, <italic>V</italic>, (<italic>S</italic> = 1 or <italic>P</italic> = 1).<break/>This assumption allows generalizing treatment effects from individuals in the trial to individuals in the target population with similar patterns of the effect modifiers.<break/>This assumption is less strict than conditional sample ignorability for potential outcomes, {<italic>Y</italic>(1), <italic>Y</italic>(0)} ⫫ {<italic>S</italic>, <italic>P</italic>}∣<italic>X</italic>, <italic>Z</italic>, <italic>V</italic>, (<italic>S</italic> = 1 or <italic>P</italic> = 1) where <italic>X</italic> denotes predictors of the potential outcomes that are not part of the set of effect modifiers {<italic>Z</italic>, <italic>V</italic>}. Yet this assumption is tied to the scale on which effects are defined.</td>
</tr>
<tr>
<td align="left">A5.</td>
<td align="left">Consistent measurement and no measurement error</td>
<td align="left">The trial’s internal validity requires no systematic measurement error of a continuous outcome and no misclassification of a categorical outcome. Here we also need to assume that all covariate measurements are without error, and that <italic>X</italic> and <italic>Z</italic> are measured the same way between the trial and the target population.</td>
</tr>
<tr>
<td align="left">A6.</td>
<td align="left">A specific causal model</td>
<td align="left">We assume a causal model with effect modification; effects should be defined on a scale that connects naturally to the model.<break/>The main methods section assumes a linear causal model (with interaction terms) and defines effects on the additive scale.</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>Assumptions A1-A5 are sufficient for estimating TATE if all effect modifiers are observed in both the trial and target population, via either G-computation or weighting the trial sample to the target population [<xref ref-type="bibr" rid="pone.0208795.ref001">1</xref>–<xref ref-type="bibr" rid="pone.0208795.ref003">3</xref>, <xref ref-type="bibr" rid="pone.0208795.ref011">11</xref>, <xref ref-type="bibr" rid="pone.0208795.ref012">12</xref>]. When some effect modifiers are not observed in the target population, however, such strategies fail. In this case, in order to use the proposed sensitivity analyses to glean some information on TATE, we make the additional assumption (A6) of a causal model. In this section we assume the linear causal model
<disp-formula id="pone.0208795.e001"><alternatives><graphic id="pone.0208795.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e001" xlink:type="simple"/><mml:math display="block" id="M1"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>a</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>x</mml:mi></mml:msub> <mml:msub><mml:mi>X</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>z</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(M1)</label></disp-formula>
where potential outcomes are influenced by treatment condition <italic>a</italic> and baseline covariates <italic>X</italic>, <italic>Z</italic>, <italic>V</italic>, all observed in the trial. <italic>X</italic>, <italic>Z</italic> and <italic>V</italic> may be multivariate; the use of univariate notation is to simplify presentation. <italic>Z</italic> and <italic>V</italic> both denote effect modifiers; the difference is <italic>Z</italic> is observed in the target population while <italic>V</italic> is not.</p>
<p>(The letter M in the equation label <xref ref-type="disp-formula" rid="pone.0208795.e001">M1</xref> indicates that this is a causal <underline>m</underline>odel. We will also use T in labels to indicate <underline>T</underline>ATE formulas, and R to indicate <underline>r</underline>egression models).</p>
<p>This model assumption should not be made lightly. With a binary outcome, for instance, this model would imply additive effects on the risk difference scale, which may be inappropriate. (See the next section for an extension of these methods to a broader class of models). Also, the selection of which pre-treatment variables to include in the model and which variables to consider effect modifiers requires serious investigation, and is discussed is great length in relevant literature, e.g., [<xref ref-type="bibr" rid="pone.0208795.ref013">13</xref>–<xref ref-type="bibr" rid="pone.0208795.ref016">16</xref>]. With the current focus on sensitivity analysis, we presume that such a model has been selected. If unsure whether a variable is an effect modifier (e.g., because its interaction with treatment has a non-negligible coefficient but its p-value is large), our recommendation is to treat it as one for the purpose of TATE estimation, since trials usually lack power to investigate effect modification.</p>
</sec>
<sec id="sec009">
<title>TATE formula</title>
<p>Based on the causal model <xref ref-type="disp-formula" rid="pone.0208795.e001">M1</xref>, individual <italic>i</italic>’s treatment effect has expectation E[<italic>Y</italic><sub><italic>i</italic></sub>(1) − <italic>Y</italic><sub><italic>i</italic></sub>(0)] = <italic>β</italic><sub><italic>a</italic></sub> + <italic>β</italic><sub><italic>za</italic></sub> <italic>Z</italic><sub><italic>i</italic></sub> + <italic>β</italic><sub><italic>va</italic></sub> <italic>V</italic><sub><italic>i</italic></sub>, therefore
<disp-formula id="pone.0208795.e002"><alternatives><graphic id="pone.0208795.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>TATE</mml:mtext> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>V</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(T1)</label></disp-formula>
where E[<italic>Z</italic>|<italic>P</italic> = 1] and E[<italic>V</italic>|<italic>P</italic> = 1] are the means of <italic>Z</italic> and <italic>V</italic> in the target population. Under Assumptions A1-A6, <italic>β</italic><sub><italic>a</italic></sub>, <italic>β</italic><sub><italic>za</italic></sub> and <italic>β</italic><sub><italic>va</italic></sub> are the same for the trial sample and target population, and can be estimated using trial data.</p>
<p>The problematic quantity in this formula is E[<italic>V</italic>|<italic>P</italic> = 1], because we do not observe <italic>V</italic> in the target population. However, if we specify a plausible range for E[<italic>V</italic>|<italic>P</italic> = 1] (the <italic>sensitivity parameter</italic>), we obtain a range of TATE estimates. We outline here two ways to do this, and provide detailed implementation instructions in <xref ref-type="table" rid="pone.0208795.t002">Table 2</xref>.</p>
<table-wrap id="pone.0208795.t002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t002</object-id>
<label>Table 2</label>
<caption>
<title>Implementation instructions.</title>
</caption>
<alternatives>
<graphic id="pone.0208795.t002g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t002" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<tbody>
<tr>
<td align="left" colspan="2"><bold>Method 1: Outcome-model-based sensitivity analysis</bold></td>
</tr>
<tr>
<td align="left">Step 1</td>
<td align="left">Obtain an estimate for E[<italic>Z</italic>|<italic>P</italic> = 1] (mean of <italic>Z</italic> in the target population), with confidence limits to reflect uncertainty (unless it is known with certainty, e.g., from a full population dataset).</td>
</tr>
<tr>
<td align="left">Step 2</td>
<td align="left">Specify a plausible range for E[<italic>V</italic>|<italic>P</italic> = 1] (aka the <italic>sensitivity parameter</italic>).
<list list-type="bullet"><list-item><p>This range should ideally be informed by knowledge about this variable from other data or from the literature regarding the target population or similar populations.</p></list-item> <list-item><p>When little information is available, a wide range can be used so that consumers of the research could be selective in interpreting the results based on information they may have on this parameter.</p></list-item></list></td>
</tr>
<tr>
<td align="left">Step 3</td>
<td align="left">Fit to the trial data the regression model <xref ref-type="disp-formula" rid="pone.0208795.e003">R1</xref>.</td>
</tr>
<tr>
<td align="left">Step 4</td>
<td align="left">For each of the lower and upper ends of the range specified for E[<italic>V</italic>|<italic>P</italic> = 1], obtain a corresponding estimate of TATE (including point estimate and confidence limits).<break/>Suppose that for E[<italic>Z</italic>|<italic>P</italic> = 1], we have a point estimate of 2 and 95% confidence interval of (1.5, 2.5); and for E[<italic>V</italic>|<italic>P</italic> = 1], we specify a plausible range of 30 to 70. TATE corresponding to one end of this range, e.g., the lower end (E[<italic>V</italic>|<italic>P</italic> = 1] = 30), is estimated as follows:
<list list-type="bullet"><list-item><p>Point estimate: Take a linear combination of the coefficients from model <xref ref-type="disp-formula" rid="pone.0208795.e003">R1</xref>—based on the TATE formula <xref ref-type="disp-formula" rid="pone.0208795.e002">T1</xref>—using the point estimate 2 of E[<italic>Z</italic>|<italic>P</italic> = 1], that is, (<italic>β</italic><sub><italic>a</italic></sub> + 2<italic>β</italic><sub><italic>za</italic></sub> + 30<italic>β</italic><sub><italic>va</italic></sub>). This can be done using the <monospace>lincom</monospace> statement after fitting the model in <monospace>Stata</monospace> or using the <monospace>estimate</monospace> statement when specifying the model in <monospace>SAS</monospace>. The output for this linear combination includes a point estimate, standard error and confidence interval. Take the point estimate of this linear combination as the point estimate for TATE.</p></list-item> <list-item><p>Confidence limits: Use the confidence limits (1.5 and 2.5) of E[<italic>Z</italic>|<italic>P</italic> = 1] to take two additional linear combinations: (<italic>β</italic><sub><italic>a</italic></sub> + 1.5<italic>β</italic><sub><italic>za</italic></sub> + 30<italic>β</italic><sub><italic>va</italic></sub>) and (<italic>β</italic><sub><italic>a</italic></sub> + 2.5<italic>β</italic><sub><italic>za</italic></sub> + 30<italic>β</italic><sub><italic>va</italic></sub>). Consider the confidence limits of these linear combinations: take the more extreme of their two upper confidence limits, and the more extreme of their two lower confidence limits, as the confidence limits for TATE.</p></list-item></list></td>
</tr>
<tr>
<td align="left">Step 5</td>
<td align="left">Plot the range of TATE with confidence bounds (y-axis) against the range specified for the sensitivity parameter E[<italic>V</italic>|<italic>P</italic> = 1] (x-axis). Specifically,
<list list-type="bullet"><list-item><p>Plot the TATE estimates corresponding to the two ends of the range obtained in step 4, each with three points, one for the point estimate and two for the confidence limits; and</p></list-item> <list-item><p>Connect the two point estimates, the two lower confidence limits, and the two upper confidence limits, using three straight lines.</p></list-item></list></td>
</tr>
<tr>
<td align="left" colspan="2"><bold>Method 2: Weighted-utcome-model-based sensitivity analysis</bold></td>
</tr>
<tr>
<td align="left">Step 0</td>
<td align="left">Weight the trial sample so that it resembles the target population with respect to <italic>X</italic>, <italic>Z</italic>.</td>
</tr>
<tr>
<td align="left">Steps 1-2</td>
<td align="left">Same as in method 1</td>
</tr>
<tr>
<td align="left">Step 3</td>
<td align="left">Fit model <xref ref-type="disp-formula" rid="pone.0208795.e003">R1</xref> to the weighted trial sample.</td>
</tr>
<tr>
<td align="left">Step 4-5</td>
<td align="left">Same as in method 1</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
</sec>
<sec id="sec010">
<title>Method 1: Outcome-model-based sensitivity analysis</title>
<p>This method requires an estimate for E[<italic>Z</italic>|<italic>P</italic> = 1] (target population mean <italic>Z</italic>), but not a target population dataset. It involves: (1) obtaining an estimate for E[<italic>Z</italic>|<italic>P</italic> = 1]; (2) specifying a plausible range for the sensitivity parameter E[<italic>V</italic>|<italic>P</italic> = 1]; (3) fitting to trial data the regression model
<disp-formula id="pone.0208795.e003"><alternatives><graphic id="pone.0208795.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e003" xlink:type="simple"/><mml:math display="block" id="M3"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>|</mml:mo> <mml:mi>A</mml:mi> <mml:mo>,</mml:mo> <mml:mi>X</mml:mi> <mml:mo>,</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>,</mml:mo> <mml:mi>V</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mi>A</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>x</mml:mi></mml:msub> <mml:mi>X</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mi>Z</mml:mi> <mml:mi>A</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:mi>V</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mi>V</mml:mi> <mml:mi>A</mml:mi> <mml:mo>;</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(R1)</label></disp-formula>
(4) combining the estimated E[<italic>Z</italic>|<italic>P</italic> = 1] and specified E[<italic>V</italic>|<italic>P</italic> = 1] with model coefficients to obtain TATE estimates (using formula <xref ref-type="disp-formula" rid="pone.0208795.e002">T1</xref>); and (5) plotting results against the sensitivity parameter.</p>
</sec>
<sec id="sec011">
<title>Method 2: Weighted-outcome-model-based sensitivity analysis</title>
<p>If a target population dataset is available, an alternative is to weight the trial sample to mimic the target population distribution of <italic>X</italic>, <italic>Z</italic>, before implementing the same steps as in method 1.</p>
<p>Simulations (see description and full results in the <xref ref-type="supplementary-material" rid="pone.0208795.s001">S1 Appendix</xref>) found that Method 2 has an advantage over method 1 with respect to bias; it provides some protection against bias due to misspecification of the outcome model. Specifically, if the outcome model is misspecified with respect to <italic>Z</italic>, method 1 is biased, but method 2 is unbiased because the weighting adjusts for the difference between the trial and target population in effect variation due to the difference in distribution of <italic>Z</italic>. Also, if the outcome model is misspecified with respect to <italic>V</italic> then both methods are biased, but if <italic>V</italic> is positively correlated with <italic>Z</italic> in the trial and influences treatment effect in the same direction as <italic>Z</italic>, method 2 is less biased than method 1, because the weighting adjustment for <italic>Z</italic> helps partially adjust for <italic>V</italic>. Method 2’s disadvantage is that it has larger variance than method 1, and suffers from some degree of variance underestimation—the variance estimated based on the fitted outcome model is on average smaller than true variance. Bias and variance combined leads to the two methods both performing well when the outcome model is correctly specified, with the method 1 confidence interval (CI) having nominal coverage (about 95%) and the method 2 CI’s coverage being only slightly smaller (around 93-94%). When the outcome model is misspecified, due to bias reduction, method 2’s CI generally has better variance than method 1’s.</p>
<p>Given these findings, we generally recommend method 2 (with the weighting), unless the two methods agree on TATE point estimates, in which case method 1’s unweighted results can be used.</p>
<sec id="sec012">
<title>Weighting procedures</title>
<p>Method 2 involves weighting the trial sample to mimic the target population distribution of <italic>X</italic>, <italic>Z</italic>. In most situations where a population dataset (either <italic>P</italic> = 1 or <italic>S</italic> = 2—see <xref ref-type="fig" rid="pone.0208795.g001">Fig 1</xref>) is available, we use <italic>weighting by the odds</italic> [<xref ref-type="bibr" rid="pone.0208795.ref003">3</xref>, <xref ref-type="bibr" rid="pone.0208795.ref018">18</xref>]. The exception is when trial participants are part of AND can be identified within the population dataset, then <italic>inverse probability weighting</italic> is used. If only population summary statistics are available, weighting is generally not used. However, if information on the joint distribution of <italic>X</italic>, <italic>Z</italic> in the target population is available, and <italic>X</italic>, <italic>Z</italic> are discrete with few combined categories, weighting may be implemented. See <xref ref-type="table" rid="pone.0208795.t003">Table 3</xref> for details on weights computation in these cases. For why they apply, see the <xref ref-type="supplementary-material" rid="pone.0208795.s002">S2 Appendix</xref>.</p>
<table-wrap id="pone.0208795.t003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t003</object-id>
<label>Table 3</label>
<caption>
<title>Weighting procedures for different target population data scenarios.</title>
</caption>
<alternatives>
<graphic id="pone.0208795.t003g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t003" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left">Target population data</th>
<th align="left">Weighting procedures</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">A <italic>P</italic> = 1 dataset is available. Trial participants cannot be identified in this <italic>P</italic> = 1 dataset.</td>
<td align="left" rowspan="2"><italic><bold>Weighting-by-the-odds</bold></italic>, i.e., weight the trial participants using weights computed as follows
<list list-type="order"><list-item><p>stacking the trial and target population datasets into one dataset, and creating a new variable <italic>S</italic>′ coded <italic>S</italic>′ = 1 for observations from the trial dataset, and <italic>S</italic>′ = 0 for observations from the target population dataset</p></list-item> <list-item><p>fitting a model using <italic>X</italic> and <italic>Z</italic> to predict <italic>S</italic>′; and for each trial participant, obtaining the predicted probability of <italic>S</italic>′ = 1 from that model (aka the trial <italic>participation score</italic>), <italic>ps</italic><sub><italic>i</italic></sub> = Pr(<italic>S</italic>′ = 1|<italic>X</italic><sub><italic>i</italic></sub>, <italic>Z</italic><sub><italic>i</italic></sub>)</p></list-item> <list-item><p>for every trial participant, computing the weights as <italic>W</italic><sub><italic>i</italic></sub> = (1 − <italic>ps</italic><sub><italic>i</italic></sub>)/<italic>ps</italic><sub><italic>i</italic></sub>, the odds of being in the target population dataset.</p></list-item></list></td>
</tr>
<tr>
<td align="left">A <italic>S</italic> = 2 dataset is available. Trial participants are either not part of the <italic>S</italic> = 2 sample, or if they are, they cannot be identified in this <italic>S</italic> = 2 dataset.</td>
</tr>
<tr>
<td align="left">A <italic>P</italic> = 1 dataset is available. Trial participants are identified in this <italic>P</italic> = 1 dataset.</td>
<td align="left" rowspan="2"><italic><bold>Inverse-probability-weighting</bold></italic>, i.e., weight the trial participants using weights computed as follows
<list list-type="order"><list-item><p>using the target poplation dataset, creating a new variable <italic>S</italic>′ coded <italic>S</italic>′ = 1 for observations that belong to the trial participants, and <italic>S</italic>′ = 0 for the remaining observations</p></list-item> <list-item><p>fitting a model using <italic>X</italic> and <italic>Z</italic> to predict <italic>S</italic>′; and for each trial participant, obtaining the predicted probability of <italic>S</italic>′ = 1 from that model (aka the trial <italic>participation score</italic>), <italic>ps</italic><sub><italic>i</italic></sub> = Pr(<italic>S</italic>′ = 1|<italic>X</italic><sub><italic>i</italic></sub>, <italic>Z</italic><sub><italic>i</italic></sub>)</p></list-item> <list-item><p>for every trial participant, computing the weights as <italic>W</italic><sub><italic>i</italic></sub> = 1/<italic>ps</italic><sub><italic>i</italic></sub>, the inverse of the probability of participating in the trial.</p></list-item></list></td>
</tr>
<tr>
<td align="left">A <italic>S</italic> = 2 dataset is available. Trial participants are part of the <italic>S</italic> = 2 sample, and are identified in this <italic>S</italic> = 2 dataset.</td>
</tr>
<tr>
<td align="left">Information on the joint distribution of {<italic>X</italic>, <italic>Z</italic>} in the target population is available.<break/><italic>X</italic>, <italic>Z</italic> are categorical with a small number of combined categories.</td>
<td align="left"><italic><bold>Ratio-of-probability-weighting</bold></italic>, specifically, weight the trial participants using weights computed by the formula <inline-formula id="pone.0208795.e004"><alternatives><graphic id="pone.0208795.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e004" xlink:type="simple"/><mml:math display="inline" id="M4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>W</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>(</mml:mo> <mml:mi>X</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>X</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>(</mml:mo> <mml:mi>X</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>X</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:mi>S</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math></alternatives></inline-formula>, where the numerator and denominator are the prevalences of the {<italic>X</italic><sub><italic>i</italic></sub>, <italic>Z</italic><sub><italic>i</italic></sub>} pattern in the target population and in the trial sample, respectively.</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>An additional note: The desired result of weighting is that the arms of the trial (i) each mimics the target population in the distribution of <italic>X</italic>, <italic>Z</italic>, and (ii) remain similar to each other in the distribution of <italic>X</italic>, <italic>Z</italic>, <italic>V</italic>. We recommend a two step procedure: first checking balance between the trial arms and adjusting via within-trial reweighting if needed; and then weighting the (adjusted) trial sample to the target population. We do not recommend weighting each trial arm to the target population separately, because it may distort between-arms balance on variables not observed in the target population.</p>
</sec>
</sec>
<sec id="sec013">
<title>What if an effect modifier is not even observed in the trial?</title>
<p>There are times when instead of an effect modifier observed in the trial but not in the target population, researchers are concerned about effect modifiers that were not measured in the trial. This may be a specific variable, e.g., addiction severity was not measured in a substance abuse treatment trial, but it is suspected to modify treatment effect and it may very well be distributed differently between the trial and the target population. Or it may be generic, when researchers are concerned that there is effect modification by unknown factors.</p>
<p>The question is whether the above-described sensitivity analyses can be extended to cover an effect modifier <italic>U</italic> (be it a specific or generic variable) that is unobserved in the trial. Unfortunately, the answer is no. It is clear from the causal model
<disp-formula id="pone.0208795.e005"><alternatives><graphic id="pone.0208795.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e005" xlink:type="simple"/><mml:math display="block" id="M5"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>a</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>x</mml:mi></mml:msub> <mml:msub><mml:mi>X</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>z</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>u</mml:mi></mml:msub> <mml:msub><mml:mi>U</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>u</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>U</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
that if we use the approach without weighting, we would need an estimate of <italic>β</italic><sub><italic>za</italic></sub>, which is unidentified from the trial because <italic>U</italic> is not observed. If we use the weighting approach and manage to equate the mean of <italic>Z</italic> between the trial sample and the target population, then we could do without <italic>β</italic><sub><italic>za</italic></sub> but instead would have to deal with the mean of <italic>U</italic> in the weighted trial sample, an obscure quantity that is not suitable to serve as a sensitivity parameter. (For technical details, see the <xref ref-type="supplementary-material" rid="pone.0208795.s003">S3 Appendix</xref>).</p>
<p>Note that this is a correction of the <italic>U</italic> case results reported in [<xref ref-type="bibr" rid="pone.0208795.ref006">6</xref>]; the appendix explains the error in those previous results.</p>
</sec>
</sec>
<sec id="sec014">
<title>Method extensions</title>
<p>Turning our attention back to effect modifiers that are observed in the trial but not in the target population (<italic>V</italic>), note that the last section (and [<xref ref-type="bibr" rid="pone.0208795.ref006">6</xref>]) addressed a simple setting. We now offer two extensions of the sensitivity analyses to more complex situations.</p>
<sec id="sec015">
<title>Extension 1: When both pre- and post-treatment outcomes are available and are modeled using random intercepts models</title>
<p>When both pre- and post-treatment measures of the outcome are available, there are several options for modeling such data. One option is to treat the pre-treatment outcome measure as a baseline covariate. Another option, which we consider here, is to model the combination of both pre- and post-treatment outcomes using random intercepts models.</p>
<p>The simplest random intercepts model in this case is the model without covariates
<disp-formula id="pone.0208795.e006"><alternatives><graphic id="pone.0208795.e006g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e006" xlink:type="simple"/><mml:math display="block" id="M6"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mrow><mml:mi>i</mml:mi> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mo>|</mml:mo> <mml:msub><mml:mi>A</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>F</mml:mi> <mml:mrow><mml:mi>i</mml:mi> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:msub><mml:mi>c</mml:mi> <mml:mrow><mml:mn>0</mml:mn> <mml:mi>i</mml:mi></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:msub><mml:mi>A</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>f</mml:mi></mml:msub> <mml:msub><mml:mi>F</mml:mi> <mml:mrow><mml:mi>i</mml:mi> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mrow><mml:mi>f</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>F</mml:mi> <mml:mrow><mml:mi>i</mml:mi> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>A</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <italic>i</italic> indexes person, <italic>j</italic> indexes observation (each person has two observations), <italic>A</italic> indicates treatment arm, <italic>F</italic> indicates whether the observation is pre-treatment (<italic>F</italic><sub><italic>i</italic>1</sub> = 0) or post-treatment (<italic>F</italic><sub><italic>i</italic>2</sub> = 1), and the coefficient <italic>γ</italic><sub><italic>fa</italic></sub> of <italic>FA</italic> represents treatment effect. Given randomization of treatment in the trial, when this model is fit to the trial data, <italic>γ</italic><sub><italic>fa</italic></sub> estimates SATE. Note that the coefficient of <italic>FA</italic> in models with baseline covariates (<italic>X</italic>, <italic>Z</italic>, <italic>V</italic>) that may interact with <italic>A</italic> or <italic>F</italic> but not with <italic>FA</italic> also estimates SATE; such models adjust for covariates when estimating the average treatment effect.</p>
<p>For the sensitivity analyses, we assume a model with effect modification analogous to <xref ref-type="disp-formula" rid="pone.0208795.e001">M1</xref>. The full details, which are somewhat more complicated than are informative, are relegated to the <xref ref-type="supplementary-material" rid="pone.0208795.s004">S4 Appendix</xref>. The key point is that this model includes not only the <italic>FA</italic> term (<italic>β</italic><sub><italic>fa</italic></sub> <italic>F</italic><sub><italic>ij</italic></sub> <italic>A</italic><sub><italic>i</italic></sub>), but also interaction terms of effect modifiers with <italic>FA</italic> (<italic>β</italic><sub><italic>zfa</italic></sub> <italic>Z</italic><sub><italic>i</italic></sub> <italic>F</italic><sub><italic>ij</italic></sub> <italic>A</italic><sub><italic>i</italic></sub> and <italic>β</italic><sub><italic>vfa</italic></sub> <italic>V</italic><sub><italic>i</italic></sub> <italic>F</italic><sub><italic>ij</italic></sub> <italic>A</italic><sub><italic>i</italic></sub>). The TATE formula in this case is
<disp-formula id="pone.0208795.e007"><alternatives><graphic id="pone.0208795.e007g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e007" xlink:type="simple"/><mml:math display="block" id="M7"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>TATE</mml:mtext> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>f</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>f</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>f</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>V</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(T2)</label></disp-formula></p>
<p>This formula is used with both method 1 and method 2—when the effect modification regression model is fit to the unweighted and weighted trial data, respectively.</p>
<p>While it is usually natural to clarify effect definitions before discussing models used to estimate such effects, in this section we have done the opposite, starting with models first. This choice is intentional because in the current case it is easier to point out the effect definition after explaining the model. As <italic>FA</italic> is an interaction of treatment arm and time (post- vs. pre-treatment), its coefficient represents a difference in difference, specifically a difference between the two treatment conditions with respect to the difference between post- and pre-treatment outcomes in each condition. This means the individual treatment effect definition here is the effect of treatment on the ‘potential outcome change’ from before to after treatment. Since pre-treatment outcome is not affected by treatment, this is equivalent to the effect of treatment on the potential post-treatment outcome. That is, the TATE and SATE in this case are exactly the same average effects defined in the previous section.</p>
</sec>
<sec id="sec016">
<title>Extension 2: Multiplicative effects on potential outcome rate/probability/odds, based on a log/logit link model</title>
<p>In the previous section, we commented that the linear model assumption is not always appropriate. We now extend the methods to cases where log/logit link outcome models are used (e.g., log mean model for a count outcome, log probability or logit model for a binary outcome). Here the individual treatment effect is defined on the multiplicative scale that matches the model (e.g., rate ratio, risk ratio, or odds ratio), and an ATE is defined as the geometric mean of the individual effects. Or equivalently, one could define the individual effect as the corresponding log rate ratio, log risk ratio or log odds ratio, and have the usual definition of ATE as the arithmetic mean of individual effects.</p>
<p>We describe the extension formally here using a binary outcome with logit model (leaving details for the other cases in the <xref ref-type="supplementary-material" rid="pone.0208795.s005">S5 Appendix</xref>). In this case we assume the logistic causal model
<disp-formula id="pone.0208795.e008"><alternatives><graphic id="pone.0208795.e008g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e008" xlink:type="simple"/><mml:math display="block" id="M8"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>log</mml:mtext> <mml:mo>{</mml:mo> <mml:mfrac><mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>a</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>a</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>]</mml:mo></mml:mrow></mml:mfrac> <mml:mo>}</mml:mo> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>x</mml:mi></mml:msub> <mml:msub><mml:mi>X</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>z</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mi>a</mml:mi> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(M3)</label></disp-formula>
the coefficients of which can be estimated by fitting the logistic regression model
<disp-formula id="pone.0208795.e009"><alternatives><graphic id="pone.0208795.e009g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e009" xlink:type="simple"/><mml:math display="block" id="M9"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>log</mml:mtext> <mml:mo>{</mml:mo> <mml:mfrac><mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>|</mml:mo> <mml:mi>A</mml:mi> <mml:mo>,</mml:mo> <mml:mi>X</mml:mi> <mml:mo>,</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>,</mml:mo> <mml:mi>V</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>|</mml:mo> <mml:mi>A</mml:mi> <mml:mo>,</mml:mo> <mml:mi>X</mml:mi> <mml:mo>,</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>,</mml:mo> <mml:mi>V</mml:mi> <mml:mo>]</mml:mo></mml:mrow></mml:mfrac> <mml:mo>}</mml:mo> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mi>A</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>x</mml:mi></mml:msub> <mml:mi>X</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>z</mml:mi></mml:msub> <mml:mi>Z</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mi>Z</mml:mi> <mml:mi>A</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:mi>V</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mi>V</mml:mi> <mml:mi>A</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(R3)</label></disp-formula>
to the original or the weighted trial sample (corresponding to method 1 or 2). Define the individual treatment effect as the odds ratio (OR) of the individual’s potential outcomes,
<disp-formula id="pone.0208795.e010"><alternatives><graphic id="pone.0208795.e010g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e010" xlink:type="simple"/><mml:math display="block" id="M10"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:msubsup><mml:mtext>TE</mml:mtext> <mml:mi>i</mml:mi> <mml:mtext>OR</mml:mtext></mml:msubsup> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:mtext>Pr</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>]</mml:mo></mml:mrow></mml:mrow> <mml:mrow><mml:mtext>Pr</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mn>0</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:mtext>Pr</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mn>0</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:mfrac> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
or the corresponding log OR
<disp-formula id="pone.0208795.e011"><alternatives><graphic id="pone.0208795.e011g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e011" xlink:type="simple"/><mml:math display="block" id="M11"><mml:mrow><mml:msubsup><mml:mrow><mml:mtext>TE</mml:mtext></mml:mrow><mml:mi>i</mml:mi><mml:mrow><mml:mtext>log</mml:mtext><mml:mo>_</mml:mo><mml:mtext>OR</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mtext>log</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mtext>TE</mml:mtext></mml:mrow><mml:mi>i</mml:mi><mml:mrow><mml:mtext>OR</mml:mtext></mml:mrow></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>.</mml:mo></mml:mrow></mml:math></alternatives></disp-formula></p>
<p>Model <xref ref-type="disp-formula" rid="pone.0208795.e008">M3</xref> implies,
<disp-formula id="pone.0208795.e012"><alternatives><graphic id="pone.0208795.e012g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e012" xlink:type="simple"/><mml:math display="block" id="M12"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:msubsup><mml:mrow><mml:mtext>TE</mml:mtext></mml:mrow><mml:mi>i</mml:mi><mml:mrow><mml:mtext>log</mml:mtext><mml:mo>_</mml:mo><mml:mtext>OR</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:msubsup><mml:mtext>TE</mml:mtext> <mml:mi>i</mml:mi> <mml:mtext>OR</mml:mtext></mml:msubsup> <mml:mo>=</mml:mo> <mml:mo form="prefix">exp</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>V</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>On the log OR scale, we have the familiar formula
<disp-formula id="pone.0208795.e013"><alternatives><graphic id="pone.0208795.e013g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e013" xlink:type="simple"/><mml:math display="block" id="M13"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msup><mml:mtext>TATE</mml:mtext><mml:mrow><mml:mtext>log</mml:mtext><mml:mo>_</mml:mo><mml:mtext>OR</mml:mtext></mml:mrow></mml:msup> <mml:mo>=</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>V</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(T3a)</label></disp-formula>
for TATE defined as the average of the individual effects in the target population. Note that ‘average’ in this definition means arithmetic mean. For effects defined on the OR scale, however, the arithmetic mean does not have a nice formula. Yet we can use another type of average that is natural to quantities on a multiplicative scale and thus is both meaningful and mathematically convenient in this case, the geometric mean. Defining TATE on the OR scale as the geometric mean of the individual ORs in the target population, we obtain
<disp-formula id="pone.0208795.e014"><alternatives><graphic id="pone.0208795.e014g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0208795.e014" xlink:type="simple"/><mml:math display="block" id="M14"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msup><mml:mtext>TATE</mml:mtext> <mml:mtext>OR</mml:mtext></mml:msup> <mml:mo>=</mml:mo> <mml:mo form="prefix">exp</mml:mo> <mml:mrow><mml:mo>{</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>a</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>z</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>+</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mrow><mml:mi>v</mml:mi> <mml:mi>a</mml:mi></mml:mrow></mml:msub> <mml:mtext>E</mml:mtext> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>V</mml:mi> <mml:mo>|</mml:mo> <mml:mi>P</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>}</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(T3b)</label></disp-formula></p>
<p>These two TATE formulas serve as the basis for essentially the same sensitivity analyses, as TATE<sup>OR</sup> = exp(TATE<sup>log_OR</sup>).</p>
<p>As an aside, an ATE defined as geometric mean of individual OR effects (termed <italic>average causal OR</italic>) is closely related to the conditional OR routinely estimated by logistic regression with main effects only. Indeed the latter is an approximate estimate of the former (see more about this in the <xref ref-type="supplementary-material" rid="pone.0208795.s005">S5 Appendix</xref>).</p>
</sec>
</sec>
<sec id="sec017">
<title>Illustration</title>
<p>The analyses presented here are merely illustrative. Results should not be taken as clinically informative. In addition to the concise presentation here, the detailed analyses can be found in <xref ref-type="supplementary-material" rid="pone.0208795.s006">S6 Appendix</xref>, with most of the code (R-code) included in the same appendix, and some Stata code in <xref ref-type="supplementary-material" rid="pone.0208795.s007">S7 Appendix</xref>. The data are provided in <xref ref-type="supplementary-material" rid="pone.0208795.s008">S8</xref> and <xref ref-type="supplementary-material" rid="pone.0208795.s009">S9</xref> Appendices.</p>
<p>The trial data include baseline and post-treatment CD4 counts and several baseline characteristics—age in years, sex, race, and severe immune suppression (SIS). The target population data include age groups, sex, and race. See <xref ref-type="table" rid="pone.0208795.t004">Table 4</xref> for a description of these variables. As noted above, when data include pre- and post-treatment measures of the outcome, there are more than one analysis options. Here we use random intercepts models on the combination of both measures. (For an application modeling post-treatment outcome only, see [<xref ref-type="bibr" rid="pone.0208795.ref006">6</xref>]). The definition of TATE is the average effect of treatment on potential CD4 count gain, and equivalently, the average effect of treatment on potential CD4 count post-treatment, in the target population.</p>
<table-wrap id="pone.0208795.t004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t004</object-id>
<label>Table 4</label>
<caption>
<title>Illustration.</title><p>Data availability.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t004g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t004" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left" rowspan="2">Variable</th>
<th align="left" rowspan="2">Description</th>
<th align="center" colspan="2">Observed in</th>
</tr>
<tr>
<th align="center">trial</th>
<th align="center">population</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">Pre-treatment CD4 count</td>
<td align="left">CD4 count, i.e., number of T-CD4 cells per ml blood, within 10 days of treatment initiation (average if more than one available)</td>
<td align="center">✔</td>
<td align="center"/>
</tr>
<tr>
<td align="left">Post-treatment CD4 count</td>
<td align="left">CD4 count within 10 days of two months on treatment (average if more than one available)</td>
<td align="center">✔</td>
<td align="center"/>
</tr>
<tr>
<td align="left">Continuous age</td>
<td align="left">Age in years</td>
<td align="center">✔</td>
<td align="center"/>
</tr>
<tr>
<td align="left">Categorical age</td>
<td align="left">4 categories: up to 29, 30-39, 40-49, and 50+</td>
<td align="center">✔</td>
<td align="center">✔</td>
</tr>
<tr>
<td align="left">Sex</td>
<td align="left">Binary, male or female</td>
<td align="center">✔</td>
<td align="center">✔</td>
</tr>
<tr>
<td align="left">Race</td>
<td align="left">Dichotomized as White or non-White</td>
<td align="center">✔</td>
<td align="center">✔</td>
</tr>
<tr>
<td align="left">Severe immune suppression</td>
<td align="left">Any CD4 count of 50 or lower within the baseline period</td>
<td align="center">✔</td>
<td align="center"/>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>We start by analyzing the trial data. The first question is whether to model CD4 count (and thereby consider its change) on the additive or multiplicative scale. CD4 count is a non-negative variable, so the additive scale may predict out of range, but it is also generally bounded above, which is more restrictive on multiplicative than on additive effects. We follow the HIV literature convention of using the additive scale for CD4 count, noting that our models may be suboptimal in this respect.</p>
<p>The two treatment arms in the trial are similar but the new treatment arm has more female patients and the old treatment arm has a higher SIS proportion (see <xref ref-type="table" rid="pone.0208795.t005">Table 5</xref>). For the moment, assume we have good enough balance; we will come back to this.</p>
<table-wrap id="pone.0208795.t005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t005</object-id>
<label>Table 5</label>
<caption>
<title>Illustration.</title><p>Covariate balance within the trial sample.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t005g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t005" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="right">New treatment<break/>(n = 478)</th>
<th align="right">Old treatment<break/>(n = 455)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">Age (mean)</td>
<td align="char" char=".">39.4</td>
<td align="char" char=".">39.5</td>
</tr>
<tr>
<td align="left">Sex (proportion female)</td>
<td align="char" char=".">0.174</td>
<td align="char" char=".">0.143</td>
</tr>
<tr>
<td align="left">Race (proportion nonWhite)</td>
<td align="char" char=".">0.473</td>
<td align="char" char=".">0.468</td>
</tr>
<tr>
<td align="left">SIS (proportion)</td>
<td align="char" char=".">0.437</td>
<td align="char" char=".">0.475</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>SATE (i.e., the average difference, between the two treatments in the trial, in CD4 count change, or equivalently, in post-treatment CD4 counts) is estimated to be 36.6, 95% CI = (28.0,45.2) cells/ml by a simple model with no covariates, and 35.8, 95% CI = (27.3,44.4) by a model that adjusts for baseline covariates. <xref ref-type="table" rid="pone.0208795.t006">Table 6</xref> shows substantial differences in covariate distribution between the trial sample and target population, suggesting these SATE estimates should not be used as estimates of TATE.</p>
<table-wrap id="pone.0208795.t006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t006</object-id>
<label>Table 6</label>
<caption>
<title>Illustration.</title><p>Covariate distribution in the trial sample and target population.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t006g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t006" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="right">Trial sample<break/>(n = 933)</th>
<th align="right">Target population<break/>(n = 54,220)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">Age (mean)</td>
<td align="right">39.5</td>
<td align="right">not available</td>
</tr>
<tr>
<td align="left">Age (range)</td>
<td align="right">16 to 75</td>
<td align="right">13 to 80</td>
</tr>
<tr>
<td align="left">Age groups (proportions)</td>
<td align="right"/>
<td align="right"/>
</tr>
<tr>
<td align="left"> 29 and younger</td>
<td align="right">0.107</td>
<td align="right">0.341</td>
</tr>
<tr>
<td align="left"> 30 to 39</td>
<td align="right">0.421</td>
<td align="right">0.309</td>
</tr>
<tr>
<td align="left"> 40 to 49</td>
<td align="right">0.348</td>
<td align="right">0.247</td>
</tr>
<tr>
<td align="left"> 50 and older</td>
<td align="right">0.123</td>
<td align="right">0.103</td>
</tr>
<tr>
<td align="left">Sex (proportion female)</td>
<td align="right">0.159</td>
<td align="right">0.266</td>
</tr>
<tr>
<td align="left">Race (proportion nonWhite)</td>
<td align="right">0.471</td>
<td align="right">0.639</td>
</tr>
<tr>
<td align="left">SIS (proportion)</td>
<td align="right">0.456</td>
<td align="right">not available</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>Through a simple analysis examining interactions of <italic>FA</italic> with baseline covariates (e.g., <italic>FA</italic>*sex), covariate pairs (e.g., <italic>FA</italic>*sex*age), and cross-classifications of categorical covariates (e.g., <italic>FA</italic>*‘nonwhite-female’), we identify that the cross-classification of race and SIS status is an effect modifier (see <xref ref-type="table" rid="pone.0208795.t007">Table 7</xref>). This variation in treatment effects is visualized in <xref ref-type="fig" rid="pone.0208795.g002">Fig 2</xref>.</p>
<table-wrap id="pone.0208795.t007" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t007</object-id>
<label>Table 7</label>
<caption>
<title>Illustration.</title><p>Excerpt from effect modification model<xref ref-type="table-fn" rid="t007fn001"><sup>a</sup></xref> fit to trial data.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t007g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t007" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="right">Estimate</th>
<th align="right">Std. Error</th>
<th align="right">df</th>
<th align="right">t value</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left"><italic>FA</italic></td>
<td align="char" char=".">19.72150</td>
<td align="char" char=".">7.862622</td>
<td align="right">923</td>
<td align="char" char=".">2.508260</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * nonWhite-noSIS</td>
<td align="char" char=".">23.44112</td>
<td align="char" char=".">11.979436</td>
<td align="right">923</td>
<td align="char" char=".">1.956780</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * White-SIS</td>
<td align="char" char=".">24.93563</td>
<td align="char" char=".">12.135934</td>
<td align="right">923</td>
<td align="char" char=".">2.054694</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * nonWhite-SIS</td>
<td align="char" char=".">21.43789</td>
<td align="char" char=".">11.956149</td>
<td align="right">923</td>
<td align="char" char=".">1.793043</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t007fn001"><p><sup>a</sup> The referent category is White-noSIS. The other covariates included are age and sex.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="pone.0208795.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Illustration.</title><p>Visualization of effect modification model.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.g002" xlink:type="simple"/>
</fig>
<p>As treatment effects vary across race-by-SIS-status categories, to obtain TATE estimates, we need the proportions of the target population that are in these categories. Race is observed in the target population, with 63.9% being nonwhite. SIS status (in the white and nonwhite groups), however, is not observed. If this were a substantive study, we would comb the literature to seek a plausible range for the proportions with SIS among White and among nonWhite people in the target population. As this is only illustrative, we specify a wide range (0.2, 0.6) for this proportion (which covers the proportion 0.456 in the trial), and assume that this proportion is the same between White and nonWhite people in the target population. With this assumption, this single proportion with SIS in the target population is now our <italic>sensitivity parameter</italic>.</p>
<p>A comment is warranted on assumption A3, that the range of the treatment effect modifiers in the target population is covered by the trial. In the current example, it is apparent that we do not have a problem with this assumption, because effect modification involves the four race-by-SIS-status categories, all of which are present in the trial sample. What might go unnoticed is that the age range in the trial sample (16 to 75) is smaller than that in the target population (13 to 80), and while we did not detect any treatment effect modification by age in the trial sample, we do not know if treatment effects for those younger than 16 or older than 75 (who are not represented in the trial sample) are the same as or different from treatment effects for those in the trial sample age range; this would be an area to consult clinical experts for their judgment. In the absence of such expert knowledge, were actual age values (rather than just age group) observed in the target population, one option would be to generalize treatment effects only to those aged 16 to 75 in the target population. This target population trimming is not an option in the current case as age values are not observed. In order to move forward, we assume that there is no effect modification by age.</p>
<p>We now apply the <italic>outcome-model-based sensitivity analysis</italic> (method 1) with the specified (0.2, 0.6) range for the sensitivity parameter (proportion with SIS in the target population). This obtains a range of TATE estimates from 36.2, 95% CI = (25.9,46.6) (corresponding to the lower end of the sensitivity parameter range) to 39.3, 95% CI = (30.0,48.6) (corresponding to the upper end of the sensitivity parameter range).</p>
<p>To apply the <italic>weighted-outcome-model-based sensitivity analysis</italic> (method 2), we need to weight the trial data to mimic the target population with respect to covariates observed in both (age group, sex, race). Heeding the recommendation of the two-step procedure, we first adjust the between-arms balance in the trial sample by inverse treatment propensity score weighting. Note that this results in a balance-adjusted SATE estimate of 33.9, 95% CI = (25.4, 42.3), which is very similar to (but slightly smaller than) the original SATE estimates. The effect modification model fit to the balance-adjusted trial data is very similar to that fit to the raw trial data. If we use that model and apply method 1, we obtain TATE estimates ranging from 34.2, 95% CI = (23.5, 44.8) to 37.1, 95% CI = (28.5, 45.7); these are slightly lower than those based on the model fit to the raw data. To use method 2, after adjusting within-trial balance, we weight the adjusted trial sample to the target population, using the weighting-by-the-odds procedure described in <xref ref-type="table" rid="pone.0208795.t003">Table 3</xref>. This results in covariate balance shown in <xref ref-type="table" rid="pone.0208795.t008">Table 8</xref>. The ATE in this weighted trial sample (which we will refer to as the (<italic>X</italic>, <italic>Z</italic>)- adjusted ATE) is 37.4, 95% CI = (27.0, 47.8), which is slightly higher than our SATE estimates. This is consistent with the fact that the weighted trial sample has higher nonWhite and SIS proportions than the original trial sample.</p>
<table-wrap id="pone.0208795.t008" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t008</object-id>
<label>Table 8</label>
<caption>
<title>Illustration.</title><p>Covariate balance between two trial arms and target population after weighting.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t008g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t008" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="right">Trial: new<break/>(n = 478)</th>
<th align="right">Trial: old<break/>(n = 455)</th>
<th align="right">Target population<break/>(n = 54,220)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">Age (mean)</td>
<td align="right">35.8</td>
<td align="right">36.1</td>
<td align="right">not available</td>
</tr>
<tr>
<td align="left">Age (range)</td>
<td align="right">16 to 75</td>
<td align="right">16 to 75</td>
<td align="right">13 to 80</td>
</tr>
<tr>
<td align="left">Age groups (proportions)</td>
<td align="right"/>
<td align="right"/>
<td align="right"/>
</tr>
<tr>
<td align="left"> 29 and younger</td>
<td align="right">0.349</td>
<td align="right">0.333</td>
<td align="right">0.341</td>
</tr>
<tr>
<td align="left"> 30 to 39</td>
<td align="right">0.304</td>
<td align="right">0.313</td>
<td align="right">0.309</td>
</tr>
<tr>
<td align="left"> 40 to 49</td>
<td align="right">0.247</td>
<td align="right">0.246</td>
<td align="right">0.247</td>
</tr>
<tr>
<td align="left"> 50 and older</td>
<td align="right">0.100</td>
<td align="right">0.107</td>
<td align="right">0.103</td>
</tr>
<tr>
<td align="left">Sex (proportion female)</td>
<td align="right">0.272</td>
<td align="right">0.260</td>
<td align="right">0.266</td>
</tr>
<tr>
<td align="left">Race (proportion nonWhite)</td>
<td align="right">0.642</td>
<td align="right">0.636</td>
<td align="right">0.639</td>
</tr>
<tr>
<td align="left">SIS (proportion)</td>
<td align="right">0.515</td>
<td align="right">0.522</td>
<td align="right">not available</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>We now fit the same effect modification model to the weighted trial sample (see model fit in <xref ref-type="table" rid="pone.0208795.t009">Table 9</xref>). Interestingly, the coefficients have changed substantially from the model fit to raw data (<xref ref-type="table" rid="pone.0208795.t007">Table 7</xref>). This is not surprising as it could be a result of model misspecification (which we suspected), and it underscores our recommendation to use the weighted method so that the model that is the basis for estimating (sensitivity analysis of) TATE is the model fit to data that is close to the target population with respect to observed variables.</p>
<table-wrap id="pone.0208795.t009" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.t009</object-id>
<label>Table 9</label>
<caption>
<title>Illustration.</title><p>Excerpt from effect modification model fit to trial data that have been weighted to the target population.</p>
</caption>
<alternatives>
<graphic id="pone.0208795.t009g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.t009" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left"/>
<th align="right">Estimate</th>
<th align="right">Std. Error</th>
<th align="right">z value</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left"><italic>FA</italic></td>
<td align="char" char=".">32.903852</td>
<td align="char" char=".">11.93896</td>
<td align="char" char=".">2.76</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * nonWhite-noSIS</td>
<td align="char" char=".">9.335134</td>
<td align="char" char=".">15.74757</td>
<td align="char" char=".">0.59</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * White-SIS</td>
<td align="char" char=".">4.593148</td>
<td align="char" char=".">14.53369</td>
<td align="char" char=".">0.32</td>
</tr>
<tr>
<td align="left"><italic>FA</italic> * nonWhite-SIS</td>
<td align="char" char=".">3.294465</td>
<td align="char" char=".">15.46597</td>
<td align="char" char=".">0.21</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>Generally we should not read much into the (lack of) statistical significance of interaction terms in the weighted model because weighting increases variance. However, the underwhelming coefficients in the fitted model above suggest that in the weighted dataset, there is not much differentiation of the group specific effects, and one could argue for using the (<italic>X</italic>, <italic>Z</italic>)-adjusted ATE as an estimate of TATE.</p>
<p>Or we could choose to proceed with a full implementation of method 2. Based on this effect modification model, we obtain TATE estimates ranging from 38.4, 95% CI = (26.0,50.9) (corresponding to the lower end, 0.20, of the range of the sensitivity parameter) to 37.5, 95% CI = (27.4,47.7) (corresponding to the upper end, 0.60, of the range of the sensitivity parameter).</p>
<p>Results from both methods are plotted in <xref ref-type="fig" rid="pone.0208795.g003">Fig 3</xref>. In this particular case, as there is not a clear slope of TATE estimates on the sensitivity parameter, we could combine these results to conclude that when between 20 and 60% of the target population have SIS, we could expect the target population average effect of the new treatment (relative to the old treatment) to be a gain in CD4 count of about 36 to 39 cells per ml (point estimate) with lower and upper confidence bounds of 26 and 51.</p>
<fig id="pone.0208795.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0208795.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Illustration.</title><p>Results from both methods.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.g003" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec018" sec-type="conclusions">
<title>Discussion</title>
<p>Policy-makers may want to use trial results to inform decisions for specific target populations. There are now methods to calibrate trial results to target populations, increasing potential for evidence-based decision-making [<xref ref-type="bibr" rid="pone.0208795.ref019">19</xref>]. However, these methods generally rely on a strong assumption that all effect modifiers differentially distributed between sample and population are observed and can be adjusted for. In this paper, we describe sensitivity analyses when this is not the case. Sensitivity analyses such as these allow researchers and decision-makers to have more appropriate confidence about population effects.</p>
<p>The methods proposed in this paper address situations where the effect definition matches the model assumed—additive effect with linear model, ratio effect with logit/log link model. While this kind of pairing is natural and commonplace, it is somewhat restrictive; there are situations where the effect definition of policy interest may not be on the same effect scale that best matches the model scientifically deemed appropriate. Our ongoing work aims to provide sensitivity analyses to situations where the model assumed is nonlinear but the effect scale of interest is additive.</p>
<p>That these sensitivity analyses rely on the assumption of a specific causal model deserves discussion, as the assumed model may or may not be close to the truth. Method 2, which combines this model with weighting, provides some protection against model misspecification, and thus has a flavor of double robustness. It is not truly doubly robust, however, because the weighting does not adjust for difference in the distribution of the partially unobserved effect modifier <italic>V</italic>. An area for further development is the search for sensitivity analysis procedures that are more flexible regarding model assumptions.</p>
<p>A challenge in generalization which we commented on is that the effect modifier range coverage assumption (A3) is perhaps commonly not met, because trial samples tend to be less diverse than target populations [<xref ref-type="bibr" rid="pone.0208795.ref020">20</xref>]. Strategies for this situation include combining evidence from multiple trials, combining experimental and non-experimental evidence using cross-design synthesis [<xref ref-type="bibr" rid="pone.0208795.ref021">21</xref>], or redefining the population to the area with overlap [<xref ref-type="bibr" rid="pone.0208795.ref022">22</xref>]. These complex approaches will require adapting sensitivity analyses.</p>
<p>Finally, it is important to note that these sensitivity analyses are not a panacea. It is best to limit the need for them in the first place. This can be done through careful consideration of target populations when designing trials, and efforts to enroll more representative trial samples. If that is not possible, trialists should carefully consider potential effect modifiers and investigate treatment effect heterogeneity. Also, to be able to adjust for effect modifiers when generalizing treatment effects, effect modifiers need to be measured consistently in trials and target population datasets [<xref ref-type="bibr" rid="pone.0208795.ref005">5</xref>, <xref ref-type="bibr" rid="pone.0208795.ref023">23</xref>]. We encourage trialists to collect covariates in the same way as is done in common population datasets in their fields. When design strategies fall short, the methods discussed here provide a sense for the robustness (or lack thereof) of results when generalizing to target populations.</p>
</sec>
<sec id="sec019">
<title>Supporting information</title>
<supplementary-material id="pone.0208795.s001" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s001" xlink:type="simple">
<label>S1 Appendix</label>
<caption>
<title>Simulations.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s002" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s002" xlink:type="simple">
<label>S2 Appendix</label>
<caption>
<title>An explanation of why the different weighting procedures apply in the different data scenarios.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s003" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s003" xlink:type="simple">
<label>S3 Appendix</label>
<caption>
<title>Additional details on the case of effect modifiers not observed in the trial.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s004" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s004" xlink:type="simple">
<label>S4 Appendix</label>
<caption>
<title>Additional details on extension 1 for random intercepts models.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s005" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s005" xlink:type="simple">
<label>S5 Appendix</label>
<caption>
<title>Additional details on extension 2 for multiplicative effects and log/logit link models.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s006" mimetype="text/html" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s006" xlink:type="simple">
<label>S6 Appendix</label>
<caption>
<title>Illustration—Main appendix with explanations and most of the code in R (read this before S7-9).</title>
<p>(HTML)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s007" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s007" xlink:type="simple">
<label>S7 Appendix</label>
<caption>
<title>Illustration—Stata code for fitting random effects models with probability weights.</title>
<p>(DO)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s008" mimetype="text/csv" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s008" xlink:type="simple">
<label>S8 Appendix</label>
<caption>
<title>Illustration—Trial data.</title>
<p>(CSV)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0208795.s009" mimetype="text/csv" position="float" xlink:href="info:doi/10.1371/journal.pone.0208795.s009" xlink:type="simple">
<label>S9 Appendix</label>
<caption>
<title>Illustration—Target population data.</title>
<p>(CSV)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>This work was supported in part by NSF grant DRL-1335843 (co-PIs E. A. Stuart and R. B. Olsen), PCORI grant ME-150227794 (co-PIs I. Dahabreh and E. A. Stuart), NIDA grant R01-DA036520 (PI R. Mojtabai), and NIAID grant R01AI100654 (PI S. R. Cole). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript. The authors acknowledge insightful comments from three referees and the academic editor, which helped improve this work.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0208795.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>, <name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>. <article-title>Generalizing evidence from randomized clinical trials to target populations: The ACTG 320 trial</article-title>. <source>American Journal of Epidemiology</source>. <year>2010</year>;<volume>172</volume>(<issue>1</issue>):<fpage>107</fpage>–<lpage>115</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/aje/kwq084" xlink:type="simple">10.1093/aje/kwq084</ext-link></comment> <object-id pub-id-type="pmid">20547574</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tipton</surname> <given-names>E</given-names></name>. <article-title>Improving generalizations from experiments using propensity score subclassification: Assumptions, properties, and contexts</article-title>. <source>Journal of Educational and Behavioral Statistics</source>. <year>2013</year>;<volume>38</volume>(<issue>3</issue>):<fpage>239</fpage>–<lpage>266</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3102/1076998612441947" xlink:type="simple">10.3102/1076998612441947</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kern</surname> <given-names>HL</given-names></name>, <name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Hill</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Green</surname> <given-names>DP</given-names></name>. <article-title>Assessing methods for generalizing experimental impact estimates to target samples</article-title>. <source>Journal of Research on Educational Effectiveness</source>. <year>2016</year>;<volume>9</volume>(<issue>1</issue>):<fpage>103</fpage>–<lpage>127</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/19345747.2015.1060282" xlink:type="simple">10.1080/19345747.2015.1060282</ext-link></comment> <object-id pub-id-type="pmid">27668031</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Bradshaw</surname> <given-names>CP</given-names></name>, <name name-style="western"><surname>Leaf</surname> <given-names>PJ</given-names></name>. <article-title>Assessing the generalizability of randomized trial results to target populations</article-title>. <source>Prevention Science</source>. <year>2015</year>;<volume>16</volume>(<issue>3</issue>):<fpage>475</fpage>–<lpage>485</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11121-014-0513-z" xlink:type="simple">10.1007/s11121-014-0513-z</ext-link></comment> <object-id pub-id-type="pmid">25307417</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Rhodes</surname> <given-names>A</given-names></name>. <article-title>Generalizing treatment effect estimates from sample to population: A case study in the difficulties of finding sufficient data</article-title>. <source>Evaluation Review</source>. <year>2016</year>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1177/0193841X16660663" xlink:type="simple">10.1177/0193841X16660663</ext-link></comment> <object-id pub-id-type="pmid">27491758</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref006">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nguyen</surname> <given-names>TQ</given-names></name>, <name name-style="western"><surname>Ebnesajjad</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>, <name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>. <article-title>Sensitivity analysis for an unobserved moderator in RCT-to-target-population generalization of treatment effects</article-title>. <source>Annals of Applied Statistics</source>. <year>2017</year>;<volume>11</volume>(<issue>1</issue>):<fpage>225</fpage>–<lpage>247</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1214/16-AOAS1001" xlink:type="simple">10.1214/16-AOAS1001</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hammer</surname> <given-names>SM</given-names></name>, <name name-style="western"><surname>Squires</surname> <given-names>KE</given-names></name>, <name name-style="western"><surname>Hughes</surname> <given-names>MD</given-names></name>, <name name-style="western"><surname>Grimes</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Demeter</surname> <given-names>LM</given-names></name>, <name name-style="western"><surname>Currier</surname> <given-names>JS</given-names></name>, <etal>et al</etal>. <article-title>A controlled trial of two nucleoside analogues plus indinavir in persons with human immunodeficiency virus infection and CD4 cell counts of 200 per cubic millimeter or less</article-title>. <source>New England Journal of Medicine</source>. <year>1997</year>;<volume>337</volume>(<issue>11</issue>):<fpage>725</fpage>–<lpage>733</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1056/NEJM199709113371101" xlink:type="simple">10.1056/NEJM199709113371101</ext-link></comment> <object-id pub-id-type="pmid">9287227</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hall</surname> <given-names>HI</given-names></name>, <name name-style="western"><surname>Song</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Rhodes</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Prejean</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>An</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>LM</given-names></name>, <etal>et al</etal>. <article-title>Estimation of HIV incidence in the United States</article-title>. <source>JAMA: The journal of the American Medical Association</source>. <year>2008</year>;<volume>300</volume>(<issue>5</issue>):<fpage>520</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jama.300.5.520" xlink:type="simple">10.1001/jama.300.5.520</ext-link></comment> <object-id pub-id-type="pmid">18677024</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pearl</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Bareinboim</surname> <given-names>E</given-names></name>. <article-title>External validity and transportability: A formal approach</article-title>. <source>JSM Proceedings</source>. <year>2011</year>; p. <fpage>157</fpage>–<lpage>171</lpage>.</mixed-citation>
</ref>
<ref id="pone.0208795.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Rubin</surname> <given-names>DB</given-names></name>. <article-title>Estimating causal effects of treatments in randomized and nonrandomized studies</article-title>. <source>Journal of Educational Psychology</source>. <year>1974</year>;<volume>66</volume>(<issue>5</issue>):<fpage>688</fpage>–<lpage>701</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1037/h0037350" xlink:type="simple">10.1037/h0037350</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pressler</surname> <given-names>TR</given-names></name>, <name name-style="western"><surname>Kaizar</surname> <given-names>EE</given-names></name>. <article-title>The use of propensity scores and observational data to estimate randomized controlled trial generalizability bias</article-title>. <source>Statistics in Medicine</source>. <year>2013</year>;<volume>32</volume>(<issue>20</issue>):<fpage>3552</fpage>–<lpage>3568</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/sim.5802" xlink:type="simple">10.1002/sim.5802</ext-link></comment> <object-id pub-id-type="pmid">23553373</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hartman</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Grieve</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Sekhon</surname> <given-names>JS</given-names></name>. <article-title>From sample average treatment effect to population average treatment effect on the treated: Combining experimental with observational studies to estimate population treatment effects</article-title>. <source>Journal of the Royal Statistical Society: Series A</source>. <year>2015</year>;. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/rssa.12094" xlink:type="simple">10.1111/rssa.12094</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kent</surname> <given-names>DM</given-names></name>, <name name-style="western"><surname>Rothwell</surname> <given-names>PM</given-names></name>, <name name-style="western"><surname>Ioannidis</surname> <given-names>JPA</given-names></name>, <name name-style="western"><surname>Altman</surname> <given-names>DG</given-names></name>, <name name-style="western"><surname>Hayward</surname> <given-names>RA</given-names></name>. <article-title>Assessing and reporting heterogeneity in treatment effects in clinical trials: A proposal</article-title>. <source>Trials</source>. <year>2010</year>;<volume>11</volume>:<fpage>85</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1745-6215-11-85" xlink:type="simple">10.1186/1745-6215-11-85</ext-link></comment> <object-id pub-id-type="pmid">20704705</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wang</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Ware</surname> <given-names>JH</given-names></name>. <article-title>Detecting moderator effects using subgroup analyses</article-title>. <source>Prevention Science</source>. <year>2013</year>;<volume>14</volume>:<fpage>111</fpage>–<lpage>120</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11121-011-0221-x" xlink:type="simple">10.1007/s11121-011-0221-x</ext-link></comment> <object-id pub-id-type="pmid">21562742</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Weiss</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>Bloom</surname> <given-names>HS</given-names></name>, <name name-style="western"><surname>Brock</surname> <given-names>T</given-names></name>. <article-title>A conceptual framework for studying the sources of variation in program effects</article-title>. <source>Journal of Policy Analysis and Management</source>. <year>2014</year>;<volume>33</volume>(<issue>3</issue>):<fpage>778</fpage>–<lpage>808</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/pam.21760" xlink:type="simple">10.1002/pam.21760</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref016">
<label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Varadhan</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Segal</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Boyd</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>AW</given-names></name>, <name name-style="western"><surname>Weiss</surname> <given-names>CO</given-names></name>. <article-title>A framework for the analysis of heterogeneity of treatment effect in patient-centered outcomes research</article-title>. <source>Journal of Clinical Epidemiology</source>. <year>2013</year>;<volume>66</volume>(<issue>8</issue>):<fpage>818</fpage>–<lpage>825</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jclinepi.2013.02.009" xlink:type="simple">10.1016/j.jclinepi.2013.02.009</ext-link></comment> <object-id pub-id-type="pmid">23651763</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lesko</surname> <given-names>CR</given-names></name>, <name name-style="western"><surname>Buchanan</surname> <given-names>AL</given-names></name>, <name name-style="western"><surname>Westreich</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Edwards</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Hudgens</surname> <given-names>MG</given-names></name>, <name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>. <article-title>Generalizing study results: A potential outcomes perspective</article-title>. <source>Epidemiology</source>. <year>2017</year>;. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1097/EDE.0000000000000664" xlink:type="simple">10.1097/EDE.0000000000000664</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Westreich</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Edwards</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Lesko</surname> <given-names>CR</given-names></name>, <name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>. <article-title>Transportability of trial results using inverse odds of sampling weights</article-title>. <source>American Journal of Epidemiology</source>. <year>2017</year>;<volume>186</volume>(<issue>8</issue>):<fpage>1010</fpage>–<lpage>1014</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/aje/kwx164" xlink:type="simple">10.1093/aje/kwx164</ext-link></comment> <object-id pub-id-type="pmid">28535275</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref019">
<label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Westreich</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Edwards</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Rogawski</surname> <given-names>ET</given-names></name>, <name name-style="western"><surname>Hudgens</surname> <given-names>MG</given-names></name>, <name name-style="western"><surname>Stuart</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>. <article-title>Causal impact: Epidemiological approaches for a public health of consequence</article-title>. <source>American Journal of Public Health</source>. <year>2016</year>;<volume>106</volume>(<issue>6</issue>):<fpage>1011</fpage>–<lpage>1012</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2105/AJPH.2016.303226" xlink:type="simple">10.2105/AJPH.2016.303226</ext-link></comment> <object-id pub-id-type="pmid">27153017</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref020">
<label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Humphreys</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Weingardt</surname> <given-names>KR</given-names></name>, <name name-style="western"><surname>Harris</surname> <given-names>AHS</given-names></name>. <article-title>Influence of subject eligibility criteria on compliance with National Institutes of Health guidelines for inclusion of women, minorities, and children in treatment research</article-title>. <source>Alcoholism: Clinical and Experimental Research</source>. <year>2007</year>;<volume>31</volume>(<issue>6</issue>):<fpage>988</fpage>–<lpage>995</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1530-0277.2007.00391.x" xlink:type="simple">10.1111/j.1530-0277.2007.00391.x</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref021">
<label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kaizar</surname> <given-names>EE</given-names></name>. <article-title>Estimating treatment effect via simple cross design synthesis</article-title>. <source>Statistics in Medicine</source>. <year>2011</year>;<volume>30</volume>(<issue>25</issue>):<fpage>2986</fpage>–<lpage>3009</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/sim.4339" xlink:type="simple">10.1002/sim.4339</ext-link></comment> <object-id pub-id-type="pmid">21898521</object-id></mixed-citation>
</ref>
<ref id="pone.0208795.ref022">
<label>22</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tipton</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Fellers</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Caverly</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Vaden-Kiernan</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Borman</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Sullivan</surname> <given-names>K</given-names></name>, <etal>et al</etal>. <article-title>Site selection in experiments: An assessment of site recruitment and generalizability in two scale-up studies</article-title>. <source>Journal of Research on Educational Effectiveness</source>. <year>2016</year>;<volume>9</volume>(<issue>sup1</issue>):<fpage>209</fpage>–<lpage>228</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/19345747.2015.1105895" xlink:type="simple">10.1080/19345747.2015.1105895</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0208795.ref023">
<label>23</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Najafzadeh</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Schneeweiss</surname> <given-names>S</given-names></name>. <article-title>From trial to target populations—Calibrating real-world data</article-title>. <source>New England Journal of Medicine</source>. <year>2017</year>;<volume>376</volume>(<issue>13</issue>):<fpage>1203</fpage>–<lpage>1205</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1056/NEJMp1614720" xlink:type="simple">10.1056/NEJMp1614720</ext-link></comment> <object-id pub-id-type="pmid">28355503</object-id></mixed-citation>
</ref>
</ref-list>
</back>
</article>