<?xml version="1.0" encoding="UTF-8"?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"><channel rdf:about="http://onlinelibrary.wiley.com/rss/journal/10.1111/(ISSN)1541-0420" xmlns="http://purl.org/rss/1.0/"><title>Biometrics</title><description> Wiley Online Library : Biometrics</description><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2F%28ISSN%291541-0420</link><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc</dc:publisher><dc:language xmlns:dc="http://purl.org/dc/elements/1.1/">en</dc:language><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/">© International Biometric Society</dc:rights><prism:issn xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">0006-341X</prism:issn><prism:eIssn xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1541-0420</prism:eIssn><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-03-01T00:00:00-05:00</dc:date><prism:coverDisplayDate xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">March 2013</prism:coverDisplayDate><prism:volume xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">69</prism:volume><prism:number xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:number><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">293</prism:endingPage><image rdf:resource="http://onlinelibrary.wiley.com/store/10.1111/biom.v69.1/asset/cover.gif?v=1&amp;s=c4e722a4ec760be333291d12892d2ee3cdc81ca9"/><items><rdf:Seq><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12033"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12032"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12054"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12026"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12031"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12027"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12025"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2F%2Fbiom.12024"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12023"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12022"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12021"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12019"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12018"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12020"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12007"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12012"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12010"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12006"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12005"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12009"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12016"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12017"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12015"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12013"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12014"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12008"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12011"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01475.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01474.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.1824"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01825.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12003"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01832.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01828.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01808.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01818.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01822.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01810.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01833.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12001"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01809.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01827.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01821.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01795.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01797.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01796.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01806.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12004"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01817.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01819.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01812.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01823.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01807.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12002"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01826.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01831.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01829.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01830.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01824.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01798.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01799.x"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12028"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12029"/><rdf:li rdf:resource="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12030"/></rdf:Seq></items></channel><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12033" xmlns="http://purl.org/rss/1.0/"><title>Naive Hypothesis Testing for Case Series Analysis with Time-Varying Exposure Onset Measurement Error: Inference for Infection-Cardiovascular Risk in Patients on Dialysis</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12033</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Naive Hypothesis Testing for Case Series Analysis with Time-Varying Exposure Onset Measurement Error: Inference for Infection-Cardiovascular Risk in Patients on Dialysis</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sandra M. Mohammed, Lorien S. Dalrymple, Damla Şentürk, Danh V. Nguyen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-06-03T11:08:13.074559-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12033</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12033</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12033</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12033-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>The case series method is useful in studying the relationship between time-varying exposures, such as infections, and acute events observed during the observation periods of individuals. It provides estimates of the relative incidences of events in risk periods (e.g., 30-day period after infections) relative to the baseline periods. When the times of exposure onsets are not known precisely, application of the case series model ignoring exposure onset measurement error leads to biased estimates. Bias-correction is necessary in order to understand the true directions and effect sizes associated with exposure risk periods, although uncorrected estimators have smaller variance. Thus, inference via hypothesis testing based on uncorrected test statistics, if valid, is potentially more powerful. Furthermore, the tests can be implemented in standard software and do not require additional auxiliary data. In this work, we examine the validity and power of naive hypothesis testing, based on applying the case series analysis to the imprecise data without correcting for the error. Based on simulation studies and theoretical calculations, we determine the validity and relative power of common hypothesis tests of interest in case series analysis. In particular, we illustrate that the tests for the global null hypothesis, the overall null hypotheses associated with all risk periods or all age effects are valid. However, tests of individual risk period parameters are not generally valid. Practical guidelines are provided and illustrated with data from patients on dialysis.</p></div></div>
]]></content:encoded><description>


Summary
The case series method is useful in studying the relationship between time-varying exposures, such as infections, and acute events observed during the observation periods of individuals. It provides estimates of the relative incidences of events in risk periods (e.g., 30-day period after infections) relative to the baseline periods. When the times of exposure onsets are not known precisely, application of the case series model ignoring exposure onset measurement error leads to biased estimates. Bias-correction is necessary in order to understand the true directions and effect sizes associated with exposure risk periods, although uncorrected estimators have smaller variance. Thus, inference via hypothesis testing based on uncorrected test statistics, if valid, is potentially more powerful. Furthermore, the tests can be implemented in standard software and do not require additional auxiliary data. In this work, we examine the validity and power of naive hypothesis testing, based on applying the case series analysis to the imprecise data without correcting for the error. Based on simulation studies and theoretical calculations, we determine the validity and relative power of common hypothesis tests of interest in case series analysis. In particular, we illustrate that the tests for the global null hypothesis, the overall null hypotheses associated with all risk periods or all age effects are valid. However, tests of individual risk period parameters are not generally valid. Practical guidelines are provided and illustrated with data from patients on dialysis.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12032" xmlns="http://purl.org/rss/1.0/"><title>Weighted Least-Squares Method for Right-Censored Data in Accelerated Failure Time Model</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12032</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Weighted Least-Squares Method for Right-Censored Data in Accelerated Failure Time Model</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lili Yu, Liang Liu, Ding-Geng(Din) Chen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-31T18:42:35.82754-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12032</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12032</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12032</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">8</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12032-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>The classical accelerated failure time (AFT) model has been extensively investigated due to its direct interpretation of the covariate effects on the mean survival time in survival analysis. However, this classical AFT model and its associated methodologies are built on the fundamental assumption of data homoscedasticity. Consequently, when the homoscedasticity assumption is violated as often seen in the real applications, the estimators lose efficiency and the associated inference is not reliable. Furthermore, none of the existing methods can estimate the intercept consistently. To overcome these drawbacks, we propose a semiparametric approach in this article for both homoscedastic and heteroscedastic data. This approach utilizes a weighted least-squares equation with synthetic observations weighted by square root of their variances where the variances are estimated via the local polynomial regression. We establish the limiting distributions of the resulting coefficient estimators and prove that both slope parameters and the intercept can be consistently estimated. We evaluate the finite sample performance of the proposed approach through simulation studies and demonstrate its superiority through real example on its efficiency and reliability over the existing methods when the data is heteroscedastic.</p></div></div>
]]></content:encoded><description>


Summary
The classical accelerated failure time (AFT) model has been extensively investigated due to its direct interpretation of the covariate effects on the mean survival time in survival analysis. However, this classical AFT model and its associated methodologies are built on the fundamental assumption of data homoscedasticity. Consequently, when the homoscedasticity assumption is violated as often seen in the real applications, the estimators lose efficiency and the associated inference is not reliable. Furthermore, none of the existing methods can estimate the intercept consistently. To overcome these drawbacks, we propose a semiparametric approach in this article for both homoscedastic and heteroscedastic data. This approach utilizes a weighted least-squares equation with synthetic observations weighted by square root of their variances where the variances are estimated via the local polynomial regression. We establish the limiting distributions of the resulting coefficient estimators and prove that both slope parameters and the intercept can be consistently estimated. We evaluate the finite sample performance of the proposed approach through simulation studies and demonstrate its superiority through real example on its efficiency and reliability over the existing methods when the data is heteroscedastic.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12054" xmlns="http://purl.org/rss/1.0/"><title>GEE for Multinomial Responses Using a Local Odds Ratios Parameterization</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12054</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">GEE for Multinomial Responses Using a Local Odds Ratios Parameterization</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Anestis Touloumis, Alan Agresti, Maria Kateri</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-31T18:08:00.426594-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12054</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12054</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12054</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">8</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12054-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>In this article, we propose a generalized estimating equations (GEE) approach for correlated ordinal or nominal multinomial responses using a local odds ratios parameterization. Our motivation lies upon observing that: (i) modeling the dependence between correlated multinomial responses via the local odds ratios is meaningful both for ordinal and nominal response scales and (ii) ordinary GEE methods might not ensure the joint existence of the estimates of the marginal regression parameters and of the dependence structure. To avoid (ii), we treat the so-called “working” association vector <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12054/asset/equation/biom12054-math-0001.gif?v=1&amp;t=hi56oxj3&amp;s=54ab52661f2acbfdab119f1e30446ddccb9cd42f" class="inlineGraphic"/> as a “nuisance” parameter vector that defines the local odds ratios structure at the marginalized contingency tables after tabulating the responses without a covariate adjustment at each time pair. To estimate <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12054/asset/equation/biom12054-math-0002.gif?v=1&amp;t=hi56oxj3&amp;s=cb501df117f3dbcfed1520608cc9eaf098a616df" class="inlineGraphic"/> and simultaneously approximate adequately possible underlying dependence structures, we employ the family of association models proposed by Goodman. In simulations, the parameter estimators with the proposed GEE method for a marginal cumulative probit model appear to be less biased and more efficient than those with the independence “working” model, especially for studies having time-varying covariates and strong correlation.</p></div></div>
]]></content:encoded><description>


Summary
In this article, we propose a generalized estimating equations (GEE) approach for correlated ordinal or nominal multinomial responses using a local odds ratios parameterization. Our motivation lies upon observing that: (i) modeling the dependence between correlated multinomial responses via the local odds ratios is meaningful both for ordinal and nominal response scales and (ii) ordinary GEE methods might not ensure the joint existence of the estimates of the marginal regression parameters and of the dependence structure. To avoid (ii), we treat the so-called “working” association vector α as a “nuisance” parameter vector that defines the local odds ratios structure at the marginalized contingency tables after tabulating the responses without a covariate adjustment at each time pair. To estimate α and simultaneously approximate adequately possible underlying dependence structures, we employ the family of association models proposed by Goodman. In simulations, the parameter estimators with the proposed GEE method for a marginal cumulative probit model appear to be less biased and more efficient than those with the independence “working” model, especially for studies having time-varying covariates and strong correlation.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12026" xmlns="http://purl.org/rss/1.0/"><title>A Revisit to Sample Size and Power Calculations for Testing Odds Ratio in Two Independent Binomials</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12026</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Revisit to Sample Size and Power Calculations for Testing Odds Ratio in Two Independent Binomials</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Fang Liu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-31T17:29:18.581416-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12026</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12026</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12026</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">543</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">549</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12026-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>We reexamine the subject of sample size determination (SSD) when testing logarithm of odds ratio (OR) against zero in two independent binomials. Four common approaches are considered: a closed-form SS formula based on the Wald test (<img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0001.gif?v=1&amp;t=hi56oxj6&amp;s=9e165b3f8d2a0c002305d3fd1a99069fb5bdf876" class="inlineGraphic"/>), closed-form formulas that meet SS requirement by score and exact tests respectively (<img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0002.gif?v=1&amp;t=hi56oxj7&amp;s=b490df91d73c5535de51db87941004316efaf3d7" class="inlineGraphic"/> and <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0003.gif?v=1&amp;t=hi56oxj7&amp;s=f3b91b1076927b65254c4d422ed603951f3687d9" class="inlineGraphic"/>), and a numerical approach to calculating SS based on likelihood ratio (LR) tests (<img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0004.gif?v=1&amp;t=hi56oxj7&amp;s=ddba0f159fe07f0138c7abf16ba6eb09a3185a92" class="inlineGraphic"/>). Several practically useful findings are presented. First, <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0005.gif?v=1&amp;t=hi56oxj8&amp;s=72221506bde7d876a1fb7a49253b3191f7c00900" class="inlineGraphic"/> is a strictly convex function of OR for OR <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0006.gif?v=1&amp;t=hi56oxj8&amp;s=e498762052847cb35b86a582b8b5f76e33add169" class="inlineGraphic"/> and OR <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0007.gif?v=1&amp;t=hi56oxj8&amp;s=6992d0d2d2b04f0bb60f46ee5206ebb2068b1080" class="inlineGraphic"/>, respectively, implying that SS calculated by <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0008.gif?v=1&amp;t=hi56oxj8&amp;s=981c0aeb5d05add00501dc841486ae9f7697662d" class="inlineGraphic"/> does not necessarily decrease as OR gets further away from 1. However, minimum SS often occurs at OR values that are deemed relatively extreme and rare in real life. <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0009.gif?v=1&amp;t=hi56oxj8&amp;s=4b05ffece88c13367e07b8b4aa2f807eb39eacfb" class="inlineGraphic"/>, and <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0010.gif?v=1&amp;t=hi56oxj9&amp;s=ae3c745c2777dbe01109128d93ef349b57f960bc" class="inlineGraphic"/> decrease monotonically as OR diverges from 1. Secondly, the optimal sampling ratio (OSR) between two independent binomials that yields maximum power for a given total SS is not always 1:1 but depends on the odds of outcome in each arm. <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0011.gif?v=1&amp;t=hi56oxj9&amp;s=d4e759e5b5c69ca8b8e2457967b8d084bbe7b5c9" class="inlineGraphic"/> benefits the most from the application of OSR in that total SS can be significantly reduced as compared to the commonly used 1:1 sampling ratio. Savings in SS by OSR in <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0012.gif?v=1&amp;t=hi56oxja&amp;s=fe679df9162a5a8a6e921294debf9f67bbb4503b" class="inlineGraphic"/>, <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0013.gif?v=1&amp;t=hi56oxja&amp;s=1710194274738d8f39eb7b613fc9cea3bd7663b5" class="inlineGraphic"/> and <img alt="inline image" src="http://onlinelibrary.wiley.com/store/10.1111/biom.12026/asset/equation/biom12026-math-0014.gif?v=1&amp;t=hi56oxja&amp;s=9d80c9fe7e09aabf637d87bf37d8c658909b6363" class="inlineGraphic"/> are relatively immaterial from a practical perspective. Finally, we use simulation studies to examine the power loyalty of each SS approach and explore penalized likelihood as a remedy for undermined power loyalty.</p></div></div>
]]></content:encoded><description>


Summary
We reexamine the subject of sample size determination (SSD) when testing logarithm of odds ratio (OR) against zero in two independent binomials. Four common approaches are considered: a closed-form SS formula based on the Wald test (nW), closed-form formulas that meet SS requirement by score and exact tests respectively (nS and nE), and a numerical approach to calculating SS based on likelihood ratio (LR) tests (nL). Several practically useful findings are presented. First, nW is a strictly convex function of OR for OR &gt;1 and OR &lt;1, respectively, implying that SS calculated by nW does not necessarily decrease as OR gets further away from 1. However, minimum SS often occurs at OR values that are deemed relatively extreme and rare in real life. nS,nE, and nL decrease monotonically as OR diverges from 1. Secondly, the optimal sampling ratio (OSR) between two independent binomials that yields maximum power for a given total SS is not always 1:1 but depends on the odds of outcome in each arm. nW benefits the most from the application of OSR in that total SS can be significantly reduced as compared to the commonly used 1:1 sampling ratio. Savings in SS by OSR in nS, nL and nE are relatively immaterial from a practical perspective. Finally, we use simulation studies to examine the power loyalty of each SS approach and explore penalized likelihood as a remedy for undermined power loyalty.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12031" xmlns="http://purl.org/rss/1.0/"><title>Stationarity Tests for Spatial Point Processes using Discrepancies</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12031</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Stationarity Tests for Spatial Point Processes using Discrepancies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sung Nok Chiu, Kwong Ip Liu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-31T17:11:05.995088-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12031</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12031</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12031</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">11</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12031-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>For testing stationarity of a given spatial point pattern, Guan (2008) proposed a model-free statistic, based on the deviations between observed and expected counts of points in expanding regions within the sampling window. This article extends his method to a general class of statistics by incorporating also such information when points are projected to the axes and by allowing different ways to construct regions in which the deviations are considered. The limiting distributions of the new statistics can be expressed in terms of integrals of a Brownian sheet and hence asymptotic critical values can be approximated. A simulation study shows that the new tests are always more powerful than that of Guan. When applied to the longleaf pine data where Guan's test gave an inconclusive answer, the new tests indicate a clear rejection of the stationarity hypothesis.</p></div></div>
]]></content:encoded><description>


Summary
For testing stationarity of a given spatial point pattern, Guan (2008) proposed a model-free statistic, based on the deviations between observed and expected counts of points in expanding regions within the sampling window. This article extends his method to a general class of statistics by incorporating also such information when points are projected to the axes and by allowing different ways to construct regions in which the deviations are considered. The limiting distributions of the new statistics can be expressed in terms of integrals of a Brownian sheet and hence asymptotic critical values can be approximated. A simulation study shows that the new tests are always more powerful than that of Guan. When applied to the longleaf pine data where Guan's test gave an inconclusive answer, the new tests indicate a clear rejection of the stationarity hypothesis.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12027" xmlns="http://purl.org/rss/1.0/"><title>Bridging Conditional and Marginal Inference for Spatially Referenced Binary Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12027</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bridging Conditional and Marginal Inference for Spatially Referenced Binary Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Laura Boehm, Brian J. Reich, Dipankar Bandyopadhyay</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-31T17:05:59.934237-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12027</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12027</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12027</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12027-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>Spatially referenced binary data are common in epidemiology and public health. Owing to its elegant log-odds interpretation of the regression coefficients, a natural model for these data is logistic regression. To account for missing confounding variables that might exhibit a spatial pattern (say, socioeconomic, biological, or environmental conditions), it is customary to include a Gaussian spatial random effect. Conditioned on the spatial random effect, the coefficients may be interpreted as log odds ratios. However, marginally over the random effects, the coefficients no longer preserve the log-odds interpretation, and the estimates are hard to interpret and generalize to other spatial regions. To resolve this issue, we propose a new spatial random effect distribution through a copula framework which ensures that the regression coefficients maintain the log-odds interpretation both conditional on and marginally over the spatial random effects. We present simulations to assess the robustness of our approach to various random effects, and apply it to an interesting dataset assessing periodontal health of Gullah-speaking African Americans. The proposed methodology is flexible enough to handle areal or geo-statistical datasets, and hierarchical models with multiple random intercepts.</p></div></div>
]]></content:encoded><description>


Summary
Spatially referenced binary data are common in epidemiology and public health. Owing to its elegant log-odds interpretation of the regression coefficients, a natural model for these data is logistic regression. To account for missing confounding variables that might exhibit a spatial pattern (say, socioeconomic, biological, or environmental conditions), it is customary to include a Gaussian spatial random effect. Conditioned on the spatial random effect, the coefficients may be interpreted as log odds ratios. However, marginally over the random effects, the coefficients no longer preserve the log-odds interpretation, and the estimates are hard to interpret and generalize to other spatial regions. To resolve this issue, we propose a new spatial random effect distribution through a copula framework which ensures that the regression coefficients maintain the log-odds interpretation both conditional on and marginally over the spatial random effects. We present simulations to assess the robustness of our approach to various random effects, and apply it to an interesting dataset assessing periodontal health of Gullah-speaking African Americans. The proposed methodology is flexible enough to handle areal or geo-statistical datasets, and hierarchical models with multiple random intercepts.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12025" xmlns="http://purl.org/rss/1.0/"><title>An Estimating Function Approach to the Analysis of Recurrent and Terminal Events</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12025</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">An Estimating Function Approach to the Analysis of Recurrent and Terminal Events</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">John D. Kalbfleisch, Douglas E. Schaubel, Yining Ye, Qi Gong</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-07T14:31:40.061416-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12025</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12025</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12025</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">9</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12025-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>In clinical and observational studies,  the event of interest can often recur on the same subject. In a more  complicated situation, there exists a terminal event (e.g., death)  which stops the recurrent event process. In many such instances,  the terminal event is strongly correlated with the recurrent event  process. We consider the recurrent/terminal event setting and model  the dependence through a shared gamma frailty that is included in  both the recurrent event rate and terminal event hazard functions.  Conditional on the frailty, a model is specified only for the  marginal recurrent event process, hence avoiding the strong  Poisson-type assumptions traditionally used. Analysis is based on  estimating functions that allow for estimation of covariate effects  on the recurrent event rate and terminal  event hazard. The method also permits estimation of the degree of  association between the two processes. Closed-form asymptotic  variance estimators are proposed. The proposed method is evaluated  through simulations to assess the applicability of the asymptotic  results in finite samples and the sensitivity of the method to its  underlying assumptions. The methods can be extended in  straightforward ways to accommodate multiple types of recurrent and  terminal events. Finally, the methods are illustrated in an analysis  of hospitalization data for patients in an international multi-center study of outcomes among dialysis patients.</p></div></div>
]]></content:encoded><description>


Summary
In clinical and observational studies,  the event of interest can often recur on the same subject. In a more  complicated situation, there exists a terminal event (e.g., death)  which stops the recurrent event process. In many such instances,  the terminal event is strongly correlated with the recurrent event  process. We consider the recurrent/terminal event setting and model  the dependence through a shared gamma frailty that is included in  both the recurrent event rate and terminal event hazard functions.  Conditional on the frailty, a model is specified only for the  marginal recurrent event process, hence avoiding the strong  Poisson-type assumptions traditionally used. Analysis is based on  estimating functions that allow for estimation of covariate effects  on the recurrent event rate and terminal  event hazard. The method also permits estimation of the degree of  association between the two processes. Closed-form asymptotic  variance estimators are proposed. The proposed method is evaluated  through simulations to assess the applicability of the asymptotic  results in finite samples and the sensitivity of the method to its  underlying assumptions. The methods can be extended in  straightforward ways to accommodate multiple types of recurrent and  terminal events. Finally, the methods are illustrated in an analysis  of hospitalization data for patients in an international multi-center study of outcomes among dialysis patients.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2F%2Fbiom.12024" xmlns="http://purl.org/rss/1.0/"><title>Partially Linear Structure Selection in Cox Models with Varying Coefficients</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2F%2Fbiom.12024</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Partially Linear Structure Selection in Cox Models with Varying Coefficients</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Heng Lian, Peng Lai, Hua Liang</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-02T06:12:16.98681-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111//biom.12024</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111//biom.12024</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2F%2Fbiom.12024</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12024-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>To explore the nonlinear interactions between covariates and an index variable, partially linear proportional hazards models have been proposed for censored survival data. However, specification of the partially linear structure was usually carried out in an ad-hoc manner by first fitting a full varying-coefficient model and visually examining the resulting fit to identify the linear part. In this article, we consider the problem of coefficient estimation and constant coefficient identification based on a double shrinkage approach. Variable selection is also considered in a coherent estimation framework, resulting in a double-penalization procedure. Under the mild assumptions, we establish asymptotic properties for the procedure such as consistency, sparesistency, constansistency, and asymptotic normality. We evaluate the performance of the proposed method by numerical simulations and demonstrate its application using a breast cancer data set.</p></div></div>
]]></content:encoded><description>


Summary
To explore the nonlinear interactions between covariates and an index variable, partially linear proportional hazards models have been proposed for censored survival data. However, specification of the partially linear structure was usually carried out in an ad-hoc manner by first fitting a full varying-coefficient model and visually examining the resulting fit to identify the linear part. In this article, we consider the problem of coefficient estimation and constant coefficient identification based on a double shrinkage approach. Variable selection is also considered in a coherent estimation framework, resulting in a double-penalization procedure. Under the mild assumptions, we establish asymptotic properties for the procedure such as consistency, sparesistency, constansistency, and asymptotic normality. We evaluate the performance of the proposed method by numerical simulations and demonstrate its application using a breast cancer data set.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12023" xmlns="http://purl.org/rss/1.0/"><title>Partly Conditional Estimation of the Effect of a Time-Dependent Factor in the Presence of Dependent Censoring</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12023</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Partly Conditional Estimation of the Effect of a Time-Dependent Factor in the Presence of Dependent Censoring</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Qi Gong, Douglas E. Schaubel</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-05-02T06:08:25.789134-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12023</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12023</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12023</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12023-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>We propose semiparametric methods for estimating the effect of a  time-dependent covariate on treatment-free survival. The data  structure of interest consists of a longitudinal sequence of  measurements and a potentially censored survival time. The factor of  interest is time-dependent. Treatment-free survival is of interest  and is dependently censored by the receipt of treatment. Patients  may be removed from consideration for treatment, temporarily or  permanently. The proposed methods combine landmark analysis and  partly conditional hazard regression. A set of calendar time cross-sections is specified, and  survival time (from cross-section date) is modeled through weighted Cox regression.  The assumed model for death is marginal in the sense that time-varying  covariates are taken as fixed at each landmark, with the mortality  hazard function implicitly averaging across future covariate  trajectories. Dependent censoring is  overcome by a variant of inverse probability of censoring weighting (IPCW). The proposed  estimators are shown to be consistent and asymptotically normal,  with consistent covariance estimators provided. Simulation studies  reveal that the proposed estimation procedures are appropriate for  practical use. We apply the proposed methods to pre-transplant mortality among end-stage liver disease (ESLD) patients.</p></div></div>
]]></content:encoded><description>


Summary
We propose semiparametric methods for estimating the effect of a  time-dependent covariate on treatment-free survival. The data  structure of interest consists of a longitudinal sequence of  measurements and a potentially censored survival time. The factor of  interest is time-dependent. Treatment-free survival is of interest  and is dependently censored by the receipt of treatment. Patients  may be removed from consideration for treatment, temporarily or  permanently. The proposed methods combine landmark analysis and  partly conditional hazard regression. A set of calendar time cross-sections is specified, and  survival time (from cross-section date) is modeled through weighted Cox regression.  The assumed model for death is marginal in the sense that time-varying  covariates are taken as fixed at each landmark, with the mortality  hazard function implicitly averaging across future covariate  trajectories. Dependent censoring is  overcome by a variant of inverse probability of censoring weighting (IPCW). The proposed  estimators are shown to be consistent and asymptotically normal,  with consistent covariance estimators provided. Simulation studies  reveal that the proposed estimation procedures are appropriate for  practical use. We apply the proposed methods to pre-transplant mortality among end-stage liver disease (ESLD) patients.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12022" xmlns="http://purl.org/rss/1.0/"><title>Identification and Efficient Estimation of the Natural Direct Effect among the Untreated</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12022</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Identification and Efficient Estimation of the Natural Direct Effect among the Untreated</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Samuel D. Lendle, Meenakshi S. Subbaraman, Mark J. van der Laan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-23T05:29:58.663567-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12022</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12022</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12022</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">8</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12022-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>The natural direct effect (NDE), or the effect of an exposure on an outcome if an   intermediate variable was set to the level it would have been in the absence of the exposure, is often of   interest to investigators. In general, the statistical parameter associated with the NDE is difficult to estimate   in the non-parametric model, particularly when the intermediate variable is continuous or high dimensional. In   this article, we introduce a new causal parameter called the natural direct effect among the untreated, discus   identifiability assumptions, propose a sensitivity analysis for some of the assumptions, and show that this new   parameter is equivalent to the NDE in a randomized controlled trial. We also present a targeted minimum loss   estimator (TMLE), a locally efficient, double robust substitution estimator for the statistical parameter   associated with this causal parameter. The TMLE can be applied to problems with continuous and high dimensional   intermediate variables, and can be used to estimate the NDE in a randomized controlled trial with such data.   Additionally, we define and discuss the estimation of three related causal parameters: the natural direct effect  among the treated, the indirect effect among the untreated and the indirect effect among the treated.</p></div></div>
]]></content:encoded><description>


Summary
The natural direct effect (NDE), or the effect of an exposure on an outcome if an   intermediate variable was set to the level it would have been in the absence of the exposure, is often of   interest to investigators. In general, the statistical parameter associated with the NDE is difficult to estimate   in the non-parametric model, particularly when the intermediate variable is continuous or high dimensional. In   this article, we introduce a new causal parameter called the natural direct effect among the untreated, discus   identifiability assumptions, propose a sensitivity analysis for some of the assumptions, and show that this new   parameter is equivalent to the NDE in a randomized controlled trial. We also present a targeted minimum loss   estimator (TMLE), a locally efficient, double robust substitution estimator for the statistical parameter   associated with this causal parameter. The TMLE can be applied to problems with continuous and high dimensional   intermediate variables, and can be used to estimate the NDE in a randomized controlled trial with such data.   Additionally, we define and discuss the estimation of three related causal parameters: the natural direct effect  among the treated, the indirect effect among the untreated and the indirect effect among the treated.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12021" xmlns="http://purl.org/rss/1.0/"><title>Joint High-Dimensional Bayesian Variable and Covariance Selection with an Application to eQTL Analysis</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12021</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Joint High-Dimensional Bayesian Variable and Covariance Selection with an Application to eQTL Analysis</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Anindya Bhadra, Bani K. Mallick</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-22T11:57:22.878859-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12021</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12021</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12021</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12021-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>We describe a Bayesian technique to (a) perform a sparse joint selection of significant predictor variables and significant inverse covariance matrix elements of the response variables in a high-dimensional linear Gaussian sparse seemingly unrelated regression (SSUR) setting and (b) perform an association analysis between the high-dimensional sets of predictors and responses in such a setting. To search the high-dimensional model space, where both the number of predictors and the number of possibly correlated responses can be larger than the sample size, we demonstrate that a marginalization-based collapsed Gibbs sampler, in combination with spike and slab type of priors, offers a computationally feasible and efficient solution. As an example, we apply our method to an expression quantitative trait loci (eQTL) analysis on publicly available single nucleotide polymorphism (SNP) and gene expression data for humans where the primary interest lies in finding the significant associations between the sets of SNPs and possibly correlated genetic transcripts. Our method also allows for inference on the sparse interaction network of the transcripts (response variables) after accounting for the effect of the SNPs (predictor variables). We exploit properties of Gaussian graphical models to make statements concerning conditional independence of the responses. Our method compares favorably to existing Bayesian approaches developed for this purpose.</p></div></div>
]]></content:encoded><description>


Summary
We describe a Bayesian technique to (a) perform a sparse joint selection of significant predictor variables and significant inverse covariance matrix elements of the response variables in a high-dimensional linear Gaussian sparse seemingly unrelated regression (SSUR) setting and (b) perform an association analysis between the high-dimensional sets of predictors and responses in such a setting. To search the high-dimensional model space, where both the number of predictors and the number of possibly correlated responses can be larger than the sample size, we demonstrate that a marginalization-based collapsed Gibbs sampler, in combination with spike and slab type of priors, offers a computationally feasible and efficient solution. As an example, we apply our method to an expression quantitative trait loci (eQTL) analysis on publicly available single nucleotide polymorphism (SNP) and gene expression data for humans where the primary interest lies in finding the significant associations between the sets of SNPs and possibly correlated genetic transcripts. Our method also allows for inference on the sparse interaction network of the transcripts (response variables) after accounting for the effect of the SNPs (predictor variables). We exploit properties of Gaussian graphical models to make statements concerning conditional independence of the responses. Our method compares favorably to existing Bayesian approaches developed for this purpose.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12019" xmlns="http://purl.org/rss/1.0/"><title>Bayesian Inference for Two-Phase Studies with Categorical Covariates</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12019</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian Inference for Two-Phase Studies with Categorical Covariates</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Michelle Ross, Jon Wakefield</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-22T11:43:31.49049-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12019</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12019</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12019</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12019-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>In this article, we consider two-phase sampling in the situation in which all covariates are categorical. Two-phase designs are appealing from an efficiency perspective since they allow sampling to be concentrated in informative cells. A number of likelihood-based methods have been developed for the analysis of two-phase data, but we describe a Bayesian approach which has previously been unavailable. The methods are first compared with existing approaches via a simulation study, and are then applied to data collected on Wilms tumor. The benefits of a Bayesian approach include relaxation of the reliance on asymptotic inference, particularly in sparse data situations, and the potential to model data with complex dependencies, for example, via the introduction of random effects. The sparse data situation is illustrated via a simulated example.</p></div></div>
]]></content:encoded><description>


Summary
In this article, we consider two-phase sampling in the situation in which all covariates are categorical. Two-phase designs are appealing from an efficiency perspective since they allow sampling to be concentrated in informative cells. A number of likelihood-based methods have been developed for the analysis of two-phase data, but we describe a Bayesian approach which has previously been unavailable. The methods are first compared with existing approaches via a simulation study, and are then applied to data collected on Wilms tumor. The benefits of a Bayesian approach include relaxation of the reliance on asymptotic inference, particularly in sparse data situations, and the potential to model data with complex dependencies, for example, via the introduction of random effects. The sparse data situation is illustrated via a simulated example.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12018" xmlns="http://purl.org/rss/1.0/"><title>Objective Bayesian Search of Gaussian Directed Acyclic Graphical Models for Ordered Variables with Non-Local Priors</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12018</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Objective Bayesian Search of Gaussian Directed Acyclic Graphical Models for Ordered Variables with Non-Local Priors</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Davide Altomare, Guido Consonni, Luca La Rocca</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-05T12:27:53.362435-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12018</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12018</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12018</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12018-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>Directed acyclic graphical (DAG) models are increasingly employed  in the study of physical and biological systems to model  direct influences between variables.  Identifying the graph from data is a challenging endeavor,  which can be more reasonably tackled if the variables are assumed to satisfy  a given ordering;  in this case we simply have to estimate the presence or absence of each potential edge.  Working under this assumption,  we propose an objective Bayesian method for searching the space of Gaussian DAG models,  which provides a rich output from minimal input.  We base our analysis on <em>non-local</em> parameter priors,  which are especially suited for learning sparse graphs,  because they allow a faster learning rate,  relative to ordinary <em>local</em> parameter priors,  when the true unknown sampling distribution belongs to a simple model.  We implement an efficient stochastic search algorithm, which deals effectively  with data sets having sample size smaller than the number of variables,  and apply our method to a variety of simulated and real data sets.  Our approach compares favorably,  in terms of the ROC curve for edge hit rate versus false alarm rate,  to current state-of-the-art frequentist methods  relying on the assumption of ordered variables;  under this assumption it exhibits a competitive advantage over the PC-algorithm,  which can be considered as a frequentist benchmark for unordered variables.  Importantly, we find that our method is still at an advantage  for learning the skeleton of the DAG,  when the ordering of the variables is only moderately mis-specified.  Prospectively, our method could be coupled with  a strategy to learn the order of the variables, thus dropping the known ordering assumption.</p></div></div>
]]></content:encoded><description>


Summary
Directed acyclic graphical (DAG) models are increasingly employed  in the study of physical and biological systems to model  direct influences between variables.  Identifying the graph from data is a challenging endeavor,  which can be more reasonably tackled if the variables are assumed to satisfy  a given ordering;  in this case we simply have to estimate the presence or absence of each potential edge.  Working under this assumption,  we propose an objective Bayesian method for searching the space of Gaussian DAG models,  which provides a rich output from minimal input.  We base our analysis on non-local parameter priors,  which are especially suited for learning sparse graphs,  because they allow a faster learning rate,  relative to ordinary local parameter priors,  when the true unknown sampling distribution belongs to a simple model.  We implement an efficient stochastic search algorithm, which deals effectively  with data sets having sample size smaller than the number of variables,  and apply our method to a variety of simulated and real data sets.  Our approach compares favorably,  in terms of the ROC curve for edge hit rate versus false alarm rate,  to current state-of-the-art frequentist methods  relying on the assumption of ordered variables;  under this assumption it exhibits a competitive advantage over the PC-algorithm,  which can be considered as a frequentist benchmark for unordered variables.  Importantly, we find that our method is still at an advantage  for learning the skeleton of the DAG,  when the ordering of the variables is only moderately mis-specified.  Prospectively, our method could be coupled with  a strategy to learn the order of the variables, thus dropping the known ordering assumption.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12020" xmlns="http://purl.org/rss/1.0/"><title>Regularization in Finite Mixture of Regression Models with Diverging Number of Parameters</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12020</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Regularization in Finite Mixture of Regression Models with Diverging Number of Parameters</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Abbas Khalili, Shili Lin</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-04T14:22:42.463903-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12020</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12020</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12020</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">ORIGINAL ARTICLE</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3>
<div class="section" id="biom12020-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><h4>Summary</h4><div class="para"><p>Feature (variable) selection has become a fundamentally important problem in recent statistical literature. Sometimes, in applications, many variables are introduced to reduce possible modeling biases, but the number of variables a model can accommodate is often limited by the amount of data available. In other words, the number of variables considered depends on the sample size, which reflects the estimability of the parametric model. In this article, we consider the problem of feature selection in finite mixture of regression models when the number of parameters in the model can increase with the sample size. We propose a penalized likelihood approach for feature selection in these models. Under certain regularity conditions, our approach leads to consistent variable selection. We carry out extensive simulation studies to evaluate the performance of the proposed approach under controlled settings. We also applied the proposed method to two real data. The first is on telemonitoring of Parkinson's disease (PD), where the problem concerns whether dysphonic features extracted from the patients’ speech signals recorded at home can be used as surrogates to study PD severity and progression. The second is on breast cancer prognosis, in which one is interested in assessing whether cell nuclear features may offer prognostic values on long-term survival of breast cancer patients. Our analysis in each of the application revealed a mixture structure in the study population and uncovered a unique relationship between the features and the response variable in each of the mixture component.</p></div></div>
]]></content:encoded><description>


Summary
Feature (variable) selection has become a fundamentally important problem in recent statistical literature. Sometimes, in applications, many variables are introduced to reduce possible modeling biases, but the number of variables a model can accommodate is often limited by the amount of data available. In other words, the number of variables considered depends on the sample size, which reflects the estimability of the parametric model. In this article, we consider the problem of feature selection in finite mixture of regression models when the number of parameters in the model can increase with the sample size. We propose a penalized likelihood approach for feature selection in these models. Under certain regularity conditions, our approach leads to consistent variable selection. We carry out extensive simulation studies to evaluate the performance of the proposed approach under controlled settings. We also applied the proposed method to two real data. The first is on telemonitoring of Parkinson's disease (PD), where the problem concerns whether dysphonic features extracted from the patients’ speech signals recorded at home can be used as surrogates to study PD severity and progression. The second is on breast cancer prognosis, in which one is interested in assessing whether cell nuclear features may offer prognostic values on long-term survival of breast cancer patients. Our analysis in each of the application revealed a mixture structure in the study population and uncovered a unique relationship between the features and the response variable in each of the mixture component.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12007" xmlns="http://purl.org/rss/1.0/"><title>A Bayesian Goodness of Fit Test and Semiparametric Generalization of Logistic Regression with Measurement Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12007</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Bayesian Goodness of Fit Test and Semiparametric Generalization of Logistic Regression with Measurement Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Angela Schörgendorfer, Adam J. Branscum, Timothy E. Hanson</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-03-14T17:34:01.638595-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12007</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12007</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12007</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Logistic regression is a popular tool for risk analysis in medical and population health science. With continuous response data, it is common to create a dichotomous outcome for logistic regression analysis by specifying a threshold for positivity. Fitting a linear regression to the nondichotomized response variable assuming a logistic sampling model for the data has been empirically shown to yield more efficient estimates of odds ratios than ordinary logistic regression of the dichotomized endpoint. We illustrate that risk inference is not robust to departures from the parametric logistic distribution. Moreover, the model assumption of proportional odds is generally not satisfied when the condition of a logistic distribution for the data is violated, leading to biased inference from a parametric logistic analysis. We develop novel Bayesian semiparametric methodology for testing goodness of fit of parametric logistic regression with continuous measurement data. The testing procedures hold for any cutoff threshold and our approach simultaneously provides the ability to perform semiparametric risk estimation. Bayes factors are calculated using the Savage–Dickey ratio for testing the null hypothesis of logistic regression versus a semiparametric generalization. We propose a fully Bayesian and a computationally efficient empirical Bayesian approach to testing, and we present methods for semiparametric estimation of risks, relative risks, and odds ratios when parametric logistic regression fails. Theoretical results establish the consistency of the empirical Bayes test. Results from simulated data show that the proposed approach provides accurate inference irrespective of whether parametric assumptions hold or not. Evaluation of risk factors for obesity shows that different inferences are derived from an analysis of a real data set when deviations from a logistic distribution are permissible in a flexible semiparametric framework.</p></div>
]]></content:encoded><description>
Summary Logistic regression is a popular tool for risk analysis in medical and population health science. With continuous response data, it is common to create a dichotomous outcome for logistic regression analysis by specifying a threshold for positivity. Fitting a linear regression to the nondichotomized response variable assuming a logistic sampling model for the data has been empirically shown to yield more efficient estimates of odds ratios than ordinary logistic regression of the dichotomized endpoint. We illustrate that risk inference is not robust to departures from the parametric logistic distribution. Moreover, the model assumption of proportional odds is generally not satisfied when the condition of a logistic distribution for the data is violated, leading to biased inference from a parametric logistic analysis. We develop novel Bayesian semiparametric methodology for testing goodness of fit of parametric logistic regression with continuous measurement data. The testing procedures hold for any cutoff threshold and our approach simultaneously provides the ability to perform semiparametric risk estimation. Bayes factors are calculated using the Savage–Dickey ratio for testing the null hypothesis of logistic regression versus a semiparametric generalization. We propose a fully Bayesian and a computationally efficient empirical Bayesian approach to testing, and we present methods for semiparametric estimation of risks, relative risks, and odds ratios when parametric logistic regression fails. Theoretical results establish the consistency of the empirical Bayes test. Results from simulated data show that the proposed approach provides accurate inference irrespective of whether parametric assumptions hold or not. Evaluation of risk factors for obesity shows that different inferences are derived from an analysis of a real data set when deviations from a logistic distribution are permissible in a flexible semiparametric framework.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12012" xmlns="http://purl.org/rss/1.0/"><title>A Joint Regression Analysis for Genetic Association Studies with Outcome Stratified Samples</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12012</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Joint Regression Analysis for Genetic Association Studies with Outcome Stratified Samples</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Colin O. Wu, Gang Zheng, Minjung Kwak</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-03-14T14:26:23.828637-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12012</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12012</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12012</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Genetic association studies in practice often involve multiple traits resulting from a common disease mechanism, and samples for such studies are often stratified based on some trait outcomes. In such situations, statistical methods using only one of these traits may be inadequate and lead to under-powered tests for detecting genetic associations. We propose in this article an estimation and testing procedure for evaluating the shared-association of a genetic marker on the joint distribution of multiple traits of a common disease. Specifically, we assume that the disease mechanism involves both quantitative and qualitative traits, and our samples could be stratified based on the qualitative trait. Through a joint likelihood function, we derive a class of estimators and test statistics for evaluating the shared genetic association on both the quantitative and qualitative traits. Our simulation study shows that the joint likelihood test procedure is potentially more powerful than association tests based on separate traits. Application of our proposed procedure is demonstrated through the rheumatoid arthritis data provided by the Genetic Analysis Workshop 16 (GAW16).</p></div>
]]></content:encoded><description>
Summary Genetic association studies in practice often involve multiple traits resulting from a common disease mechanism, and samples for such studies are often stratified based on some trait outcomes. In such situations, statistical methods using only one of these traits may be inadequate and lead to under-powered tests for detecting genetic associations. We propose in this article an estimation and testing procedure for evaluating the shared-association of a genetic marker on the joint distribution of multiple traits of a common disease. Specifically, we assume that the disease mechanism involves both quantitative and qualitative traits, and our samples could be stratified based on the qualitative trait. Through a joint likelihood function, we derive a class of estimators and test statistics for evaluating the shared genetic association on both the quantitative and qualitative traits. Our simulation study shows that the joint likelihood test procedure is potentially more powerful than association tests based on separate traits. Application of our proposed procedure is demonstrated through the rheumatoid arthritis data provided by the Genetic Analysis Workshop 16 (GAW16).
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12010" xmlns="http://purl.org/rss/1.0/"><title>Quantile Regression for Recurrent Gap Time Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12010</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Quantile Regression for Recurrent Gap Time Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xianghua Luo, Chiung-Yu Huang, Lan Wang</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-03-11T12:50:01.984598-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12010</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12010</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12010</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Evaluating covariate effects on gap times between successive recurrent events is of interest in many medical and public health studies. While most existing methods for recurrent gap time analysis focus on modeling the hazard function of gap times, a direct interpretation of the covariate effects on the gap times is not available through these methods. In this article, we consider quantile regression that can provide direct assessment of covariate effects on the quantiles of the gap time distribution. Following the spirit of the weighted risk-set method by <a href="#b16" rel="references:#b16">Luo and Huang (2011</a>, <em>Statistics in Medicine</em> <b>30</b>, 301–311), we extend the martingale-based estimating equation method considered by <a href="#b18" rel="references:#b18">Peng and Huang (2008</a>, <em>Journal of the American Statistical Association</em> <b>103</b>, 637–649) for univariate survival data to analyze recurrent gap time data. The proposed estimation procedure can be easily implemented in existing software for univariate censored quantile regression. Uniform consistency and weak convergence of the proposed estimators are established. Monte Carlo studies demonstrate the effectiveness of the proposed method. An application to data from the Danish Psychiatric Central Register is presented to illustrate the methods developed in this article.</p></div>
]]></content:encoded><description>
Summary Evaluating covariate effects on gap times between successive recurrent events is of interest in many medical and public health studies. While most existing methods for recurrent gap time analysis focus on modeling the hazard function of gap times, a direct interpretation of the covariate effects on the gap times is not available through these methods. In this article, we consider quantile regression that can provide direct assessment of covariate effects on the quantiles of the gap time distribution. Following the spirit of the weighted risk-set method by Luo and Huang (2011, Statistics in Medicine 30, 301–311), we extend the martingale-based estimating equation method considered by Peng and Huang (2008, Journal of the American Statistical Association 103, 637–649) for univariate survival data to analyze recurrent gap time data. The proposed estimation procedure can be easily implemented in existing software for univariate censored quantile regression. Uniform consistency and weak convergence of the proposed estimators are established. Monte Carlo studies demonstrate the effectiveness of the proposed method. An application to data from the Danish Psychiatric Central Register is presented to illustrate the methods developed in this article.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12006" xmlns="http://purl.org/rss/1.0/"><title>A Generalized Kruskal–Wallis Test Incorporating Group Uncertainty with Application to Genetic Association Studies</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12006</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Generalized Kruskal–Wallis Test Incorporating Group Uncertainty with Application to Genetic Association Studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Elif F. Acar, Lei Sun</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-26T12:35:09.78955-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12006</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12006</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12006</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Motivated by genetic association studies of SNPs with genotype uncertainty, we propose a generalization of the Kruskal–Wallis test that incorporates group uncertainty when comparing <span class="mathematics"><em>k</em></span> samples. The extended test statistic is based on probability-weighted rank-sums and follows an asymptotic chi-square distribution with <span class="mathematics"><em>k</em>− 1</span> degrees of freedom under the null hypothesis. Simulation studies confirm the validity and robustness of the proposed test in finite samples. Application to a genome-wide association study of type 1 diabetic complications further demonstrates the utilities of this generalized Kruskal–Wallis test for studies with group uncertainty. The method has been implemented as an open-resource R program, <em>GKW</em>.</p></div>
]]></content:encoded><description>
Summary Motivated by genetic association studies of SNPs with genotype uncertainty, we propose a generalization of the Kruskal–Wallis test that incorporates group uncertainty when comparing k samples. The extended test statistic is based on probability-weighted rank-sums and follows an asymptotic chi-square distribution with k− 1 degrees of freedom under the null hypothesis. Simulation studies confirm the validity and robustness of the proposed test in finite samples. Application to a genome-wide association study of type 1 diabetic complications further demonstrates the utilities of this generalized Kruskal–Wallis test for studies with group uncertainty. The method has been implemented as an open-resource R program, GKW.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12005" xmlns="http://purl.org/rss/1.0/"><title>A Causal Model for Joint Evaluation of Placebo and Treatment-Specific Effects in Clinical Trials</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12005</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Causal Model for Joint Evaluation of Placebo and Treatment-Specific Effects in Clinical Trials</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhiwei Zhang, Richard M. Kotz, Chenguang Wang, Shiling Ruan, Martin Ho</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-22T16:05:54.222337-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12005</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12005</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12005</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Evaluation of medical treatments is frequently complicated by the presence of substantial placebo effects, especially on relatively subjective endpoints, and the standard solution to this problem is a randomized, double-blinded, placebo-controlled clinical trial. However, effective blinding does not guarantee that all patients have the same belief or mentality about which treatment they have received (or treatmentality, for brevity), making it difficult to interpret the usual intent-to-treat effect as a causal effect. We discuss the causal relationships among treatment, treatmentality and the clinical outcome of interest, and propose a causal model for joint evaluation of placebo and treatment-specific effects. The model highlights the importance of measuring and incorporating patient treatmentality and suggests that each treatment group should be considered a separate observational study with a patient’s treatmentality playing the role of an uncontrolled exposure. This perspective allows us to adapt existing methods for dealing with confounding to joint estimation of placebo and treatment-specific effects using measured treatmentality data, commonly known as blinding assessment data. We first apply this approach to the most common type of blinding assessment data, which is categorical, and illustrate the methods using an example from asthma. We then propose that blinding assessment data can be collected as a continuous variable, specifically when a patient’s treatmentality is measured as a subjective probability, and describe analytic methods for that case.</p></div>
]]></content:encoded><description>
Summary Evaluation of medical treatments is frequently complicated by the presence of substantial placebo effects, especially on relatively subjective endpoints, and the standard solution to this problem is a randomized, double-blinded, placebo-controlled clinical trial. However, effective blinding does not guarantee that all patients have the same belief or mentality about which treatment they have received (or treatmentality, for brevity), making it difficult to interpret the usual intent-to-treat effect as a causal effect. We discuss the causal relationships among treatment, treatmentality and the clinical outcome of interest, and propose a causal model for joint evaluation of placebo and treatment-specific effects. The model highlights the importance of measuring and incorporating patient treatmentality and suggests that each treatment group should be considered a separate observational study with a patient’s treatmentality playing the role of an uncontrolled exposure. This perspective allows us to adapt existing methods for dealing with confounding to joint estimation of placebo and treatment-specific effects using measured treatmentality data, commonly known as blinding assessment data. We first apply this approach to the most common type of blinding assessment data, which is categorical, and illustrate the methods using an example from asthma. We then propose that blinding assessment data can be collected as a continuous variable, specifically when a patient’s treatmentality is measured as a subjective probability, and describe analytic methods for that case.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12009" xmlns="http://purl.org/rss/1.0/"><title>Exact Goodness-of-Fit Tests for Markov Chains</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12009</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Exact Goodness-of-Fit Tests for Markov Chains</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">J. Besag, D. Mondal</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-21T12:46:48.623133-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12009</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12009</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12009</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Goodness-of-fit tests are useful in assessing whether a statistical model is consistent with available data. However, the usual <span class="mathematics">χ<sup>2</sup></span> asymptotics often fail, either because of the paucity of the data or because a nonstandard test statistic is of interest. In this article, we describe exact goodness-of-fit tests for first- and higher order Markov chains, with particular attention given to time-reversible ones. The tests are obtained by conditioning on the sufficient statistics for the transition probabilities and are implemented by simple Monte Carlo sampling or by Markov chain Monte Carlo. They apply both to single and to multiple sequences and allow a free choice of test statistic. Three examples are given. The first concerns multiple sequences of dry and wet January days for the years 1948–1983 at Snoqualmie Falls, Washington State, and suggests that standard analysis may be misleading. The second one is for a four-state DNA sequence and lends support to the original conclusion that a second-order Markov chain provides an adequate fit to the data. The last one is six-state atomistic data arising in molecular conformational dynamics simulation of solvated alanine dipeptide and points to strong evidence against a first-order reversible Markov chain at 6 picosecond time steps.</p></div>
]]></content:encoded><description>
Summary Goodness-of-fit tests are useful in assessing whether a statistical model is consistent with available data. However, the usual χ2 asymptotics often fail, either because of the paucity of the data or because a nonstandard test statistic is of interest. In this article, we describe exact goodness-of-fit tests for first- and higher order Markov chains, with particular attention given to time-reversible ones. The tests are obtained by conditioning on the sufficient statistics for the transition probabilities and are implemented by simple Monte Carlo sampling or by Markov chain Monte Carlo. They apply both to single and to multiple sequences and allow a free choice of test statistic. Three examples are given. The first concerns multiple sequences of dry and wet January days for the years 1948–1983 at Snoqualmie Falls, Washington State, and suggests that standard analysis may be misleading. The second one is for a four-state DNA sequence and lends support to the original conclusion that a second-order Markov chain provides an adequate fit to the data. The last one is six-state atomistic data arising in molecular conformational dynamics simulation of solvated alanine dipeptide and points to strong evidence against a first-order reversible Markov chain at 6 picosecond time steps.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12016" xmlns="http://purl.org/rss/1.0/"><title>Mark-Specific Hazard Ratio Model with Multivariate Continuous Marks: An Application to Vaccine Efficacy</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12016</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Mark-Specific Hazard Ratio Model with Multivariate Continuous Marks: An Application to Vaccine Efficacy</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">M. Juraska, P. B. Gilbert</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-19T12:09:53.804294-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12016</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12016</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12016</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> In randomized placebo-controlled preventive HIV vaccine efficacy trials, an objective is to evaluate the relationship between vaccine efficacy to prevent infection and genetic distances of the exposing HIV strains to the multiple HIV sequences included in the vaccine construct, where the set of genetic distances is considered as the continuous multivariate “mark” observed in infected subjects only. This research develops a multivariate mark-specific hazard ratio model in the competing risks failure time analysis framework for the assessment of mark-specific vaccine efficacy. It allows improved efficiency of estimation by employing the semiparametric method of maximum profile likelihood estimation in the vaccine-to-placebo mark density ratio model. The model also enables the use of a more efficient estimation method for the overall log hazard ratio in the Cox model. In addition, we propose testing procedures to evaluate two relevant hypotheses concerning mark-specific vaccine efficacy. The asymptotic properties and finite-sample performance of the inferential procedures are investigated. Finally, we apply the proposed methods to data collected in the Thai RV144 HIV vaccine efficacy trial.</p></div>
]]></content:encoded><description>
Summary In randomized placebo-controlled preventive HIV vaccine efficacy trials, an objective is to evaluate the relationship between vaccine efficacy to prevent infection and genetic distances of the exposing HIV strains to the multiple HIV sequences included in the vaccine construct, where the set of genetic distances is considered as the continuous multivariate “mark” observed in infected subjects only. This research develops a multivariate mark-specific hazard ratio model in the competing risks failure time analysis framework for the assessment of mark-specific vaccine efficacy. It allows improved efficiency of estimation by employing the semiparametric method of maximum profile likelihood estimation in the vaccine-to-placebo mark density ratio model. The model also enables the use of a more efficient estimation method for the overall log hazard ratio in the Cox model. In addition, we propose testing procedures to evaluate two relevant hypotheses concerning mark-specific vaccine efficacy. The asymptotic properties and finite-sample performance of the inferential procedures are investigated. Finally, we apply the proposed methods to data collected in the Thai RV144 HIV vaccine efficacy trial.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12017" xmlns="http://purl.org/rss/1.0/"><title>A Strategy for Bayesian Inference for Computationally Expensive Models with Application to the Estimation of Stem Cell Properties</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12017</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Strategy for Bayesian Inference for Computationally Expensive Models with Application to the Estimation of Stem Cell Properties</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Antony M. Overstall, David C. Woods</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-19T11:57:35.740276-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12017</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12017</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12017</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> Bayesian inference is considered for statistical models that depend on the evaluation of a computationally expensive computer code or simulator. For such situations, the number of evaluations of the likelihood function, and hence of the unnormalized posterior probability density function, is determined by the available computational resource and may be extremely limited. We present a new example of such a simulator that describes the properties of human embryonic stem cells using data from optical trapping experiments. This application is used to motivate a novel strategy for Bayesian inference which exploits a Gaussian process approximation of the simulator and allows computationally efficient Markov chain Monte Carlo inference. The advantages of this strategy over previous methodology are that it is less reliant on the determination of tuning parameters and allows the application of model diagnostic procedures that require no additional evaluations of the simulator. We show the advantages of our method on synthetic examples and demonstrate its application on stem cell experiments.</p></div>
]]></content:encoded><description>
Summary Bayesian inference is considered for statistical models that depend on the evaluation of a computationally expensive computer code or simulator. For such situations, the number of evaluations of the likelihood function, and hence of the unnormalized posterior probability density function, is determined by the available computational resource and may be extremely limited. We present a new example of such a simulator that describes the properties of human embryonic stem cells using data from optical trapping experiments. This application is used to motivate a novel strategy for Bayesian inference which exploits a Gaussian process approximation of the simulator and allows computationally efficient Markov chain Monte Carlo inference. The advantages of this strategy over previous methodology are that it is less reliant on the determination of tuning parameters and allows the application of model diagnostic procedures that require no additional evaluations of the simulator. We show the advantages of our method on synthetic examples and demonstrate its application on stem cell experiments.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12015" xmlns="http://purl.org/rss/1.0/"><title>Generalized Partially Linear Models for Incomplete Longitudinal Data In the Presence of Population-Level Information</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12015</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Generalized Partially Linear Models for Incomplete Longitudinal Data In the Presence of Population-Level Information</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Baojiang Chen, Xiao-Hua Zhou</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-16T08:35:22.225546-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12015</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12015</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12015</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> In observational studies, interest often lies in estimation of the population-level relationship between the explanatory variables and dependent variables, and the estimation is often done using longitudinal data. Longitudinal data often feature sampling error and bias due to nonrandom drop-out. However, inclusion of population-level information can increase estimation efficiency. In this article, we consider a generalized partially linear model for incomplete longitudinal data in the presence of the population-level information. A pseudo-empirical likelihood-based method is introduced to incorporate population-level information, and nonrandom drop-out bias is corrected by using a weighted generalized estimating equations method. A three-step estimation procedure is proposed, which makes the computation easier. Several methods that are often used in practice are compared in simulation studies, which demonstrate that our proposed method can correct the nonrandom drop-out bias and increase the estimation efficiency, especially for small sample size or when the missing proportion is high. We apply this method to an Alzheimer’s disease study.</p></div>
]]></content:encoded><description>
Summary In observational studies, interest often lies in estimation of the population-level relationship between the explanatory variables and dependent variables, and the estimation is often done using longitudinal data. Longitudinal data often feature sampling error and bias due to nonrandom drop-out. However, inclusion of population-level information can increase estimation efficiency. In this article, we consider a generalized partially linear model for incomplete longitudinal data in the presence of the population-level information. A pseudo-empirical likelihood-based method is introduced to incorporate population-level information, and nonrandom drop-out bias is corrected by using a weighted generalized estimating equations method. A three-step estimation procedure is proposed, which makes the computation easier. Several methods that are often used in practice are compared in simulation studies, which demonstrate that our proposed method can correct the nonrandom drop-out bias and increase the estimation efficiency, especially for small sample size or when the missing proportion is high. We apply this method to an Alzheimer’s disease study.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12013" xmlns="http://purl.org/rss/1.0/"><title>Outcome Vector Dependent Sampling with Longitudinal Continuous Response Data: Stratified Sampling Based on Summary Statistics</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12013</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Outcome Vector Dependent Sampling with Longitudinal Continuous Response Data: Stratified Sampling Based on Summary Statistics</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jonathan S. Schildcrout, Shawn P. Garbett, Patrick J. Heagerty</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T15:31:17.261845-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12013</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12013</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12013</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> The analysis of longitudinal trajectories usually focuses on evaluation of explanatory factors that are either associated with rates of change, or with overall mean levels of a continuous outcome variable. In this article, we introduce valid design and analysis methods that permit outcome dependent sampling of longitudinal data for scenarios where all outcome data currently exist, but a targeted substudy is being planned in order to collect additional key exposure information on a limited number of subjects. We propose a stratified sampling based on specific summaries of individual longitudinal trajectories, and we detail an ascertainment corrected maximum likelihood approach for estimation using the resulting biased sample of subjects. In addition, we demonstrate that the efficiency of an outcome-based sampling design relative to use of a simple random sample depends highly on the choice of outcome summary statistic used to direct sampling, and we show a natural link between the goals of the longitudinal regression model and corresponding desirable designs. Using data from the Childhood Asthma Management Program, where genetic information required retrospective ascertainment, we study a range of designs that examine lung function profiles over 4 years of follow-up for children classified according to their genotype for the IL 13 cytokine.</p></div>
]]></content:encoded><description>
Summary The analysis of longitudinal trajectories usually focuses on evaluation of explanatory factors that are either associated with rates of change, or with overall mean levels of a continuous outcome variable. In this article, we introduce valid design and analysis methods that permit outcome dependent sampling of longitudinal data for scenarios where all outcome data currently exist, but a targeted substudy is being planned in order to collect additional key exposure information on a limited number of subjects. We propose a stratified sampling based on specific summaries of individual longitudinal trajectories, and we detail an ascertainment corrected maximum likelihood approach for estimation using the resulting biased sample of subjects. In addition, we demonstrate that the efficiency of an outcome-based sampling design relative to use of a simple random sample depends highly on the choice of outcome summary statistic used to direct sampling, and we show a natural link between the goals of the longitudinal regression model and corresponding desirable designs. Using data from the Childhood Asthma Management Program, where genetic information required retrospective ascertainment, we study a range of designs that examine lung function profiles over 4 years of follow-up for children classified according to their genotype for the IL 13 cytokine.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12014" xmlns="http://purl.org/rss/1.0/"><title>Design and Estimation for Evaluating Principal Surrogate Markers in Vaccine Trials</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12014</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Design and Estimation for Evaluating Principal Surrogate Markers in Vaccine Trials</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ying Huang, Peter B. Gilbert, Julian Wolfson</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T14:48:02.937611-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12014</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12014</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12014</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> In vaccine research, immune biomarkers that can reliably predict a vaccine’s effect on the clinical endpoint (i.e., surrogate markers) are important tools for guiding vaccine development. This article addresses issues on optimizing two-phase sampling study design for evaluating surrogate markers in a principal surrogate framework, motivated by the design of a future HIV vaccine trial. To address the problem of missing potential outcomes in a standard trial design, novel trial designs have been proposed that utilize baseline predictors of the immune response biomarker(s) and/or augment the trial by vaccinating uninfected placebo recipients at the end of the trial and measuring their immune biomarkers. However, inefficient use of the augmented information can lead to counter-intuitive results on the precision of estimation. To remedy this problem, we propose a pseudo-score type estimator suitable for the augmented design and characterize its asymptotic properties. This estimator has superior performance compared with existing estimators and allows calculation of analytical variances useful for guiding study design. Based on the new estimator we investigate in detail the problem of optimizing the sampling scheme of a biomarker in a vaccine efficacy trial for efficiently estimating its surrogate effect, as characterized by the vaccine efficacy curve (a causal effect predictiveness curve) and by the predicted overall vaccine efficacy using the biomarker.</p></div>
]]></content:encoded><description>
Summary In vaccine research, immune biomarkers that can reliably predict a vaccine’s effect on the clinical endpoint (i.e., surrogate markers) are important tools for guiding vaccine development. This article addresses issues on optimizing two-phase sampling study design for evaluating surrogate markers in a principal surrogate framework, motivated by the design of a future HIV vaccine trial. To address the problem of missing potential outcomes in a standard trial design, novel trial designs have been proposed that utilize baseline predictors of the immune response biomarker(s) and/or augment the trial by vaccinating uninfected placebo recipients at the end of the trial and measuring their immune biomarkers. However, inefficient use of the augmented information can lead to counter-intuitive results on the precision of estimation. To remedy this problem, we propose a pseudo-score type estimator suitable for the augmented design and characterize its asymptotic properties. This estimator has superior performance compared with existing estimators and allows calculation of analytical variances useful for guiding study design. Based on the new estimator we investigate in detail the problem of optimizing the sampling scheme of a biomarker in a vaccine efficacy trial for efficiently estimating its surrogate effect, as characterized by the vaccine efficacy curve (a causal effect predictiveness curve) and by the predicted overall vaccine efficacy using the biomarker.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12008" xmlns="http://purl.org/rss/1.0/"><title>Distributed Lag Models for Hydrological Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12008</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Distributed Lag Models for Hydrological Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Alastair M. Rushworth, Adrian W. Bowman, Mark J. Brewer, Simon J. Langan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T14:46:31.153363-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12008</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12008</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12008</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> The distributed lag model (DLM), used most prominently in air pollution studies, finds application wherever the effect of a covariate is delayed and distributed through time. We specify modified formulations of DLMs to provide computationally attractive, flexible varying-coefficient models that are applicable in any setting in which lagged covariates are regressed on a time-dependent response. We investigate the application of such models to rainfall and river flow and in particular their role in understanding the impact of hidden variables at work in river systems. We apply two models to data from a Scottish mountain river, and we fit to some simulated data to check the efficacy of our model approach. During heavy rainfall conditions, changes in the influence of rainfall on flow arise through a complex interaction between antecedent ground wetness and a time-delay in rainfall. The models identify subtle changes in responsiveness to rainfall, particularly in the location of peak influence in the lag structure.</p></div>
]]></content:encoded><description>
Summary The distributed lag model (DLM), used most prominently in air pollution studies, finds application wherever the effect of a covariate is delayed and distributed through time. We specify modified formulations of DLMs to provide computationally attractive, flexible varying-coefficient models that are applicable in any setting in which lagged covariates are regressed on a time-dependent response. We investigate the application of such models to rainfall and river flow and in particular their role in understanding the impact of hidden variables at work in river systems. We apply two models to data from a Scottish mountain river, and we fit to some simulated data to check the efficacy of our model approach. During heavy rainfall conditions, changes in the influence of rainfall on flow arise through a complex interaction between antecedent ground wetness and a time-delay in rainfall. The models identify subtle changes in responsiveness to rainfall, particularly in the location of peak influence in the lag structure.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12011" xmlns="http://purl.org/rss/1.0/"><title>Recovering Gradients from Sparsely Observed Functional Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12011</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Recovering Gradients from Sparsely Observed Functional Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sara López-Pintado, Ian W. McKeague</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T13:39:28.268035-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12011</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12011</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12011</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> The recovery of gradients of sparsely observed functional data is a challenging ill-posed inverse problem. Given observations of smooth curves (e.g., growth curves) at isolated time points, the aim is to provide estimates of the underlying gradients (or growth velocities). To address this problem, we develop a Bayesian inversion approach that models the gradient in the gaps between the observation times by a tied-down Brownian motion, conditionally on its values at the observation times. The posterior mean and covariance kernel of the growth velocities are then found to have explicit and computationally tractable representations in terms of quadratic splines. The hyperparameters in the prior are specified via nonparametric empirical Bayes, with the prior precision matrix at the observation times estimated by constrained <span class="mathematics">ℓ<sub>1</sub></span> minimization. The infinitessimal variance of the Brownian motion prior is selected by cross-validation. The approach is illustrated using both simulated and real data examples.</p></div>
]]></content:encoded><description>
Summary The recovery of gradients of sparsely observed functional data is a challenging ill-posed inverse problem. Given observations of smooth curves (e.g., growth curves) at isolated time points, the aim is to provide estimates of the underlying gradients (or growth velocities). To address this problem, we develop a Bayesian inversion approach that models the gradient in the gaps between the observation times by a tied-down Brownian motion, conditionally on its values at the observation times. The posterior mean and covariance kernel of the growth velocities are then found to have explicit and computationally tractable representations in terms of quadratic splines. The hyperparameters in the prior are specified via nonparametric empirical Bayes, with the prior precision matrix at the observation times estimated by constrained ℓ1 minimization. The infinitessimal variance of the Brownian motion prior is selected by cross-validation. The approach is illustrated using both simulated and real data examples.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01475.x" xmlns="http://purl.org/rss/1.0/"><title>Rejoinder to “A Note on Type II Error Under Random Effects Misspecification in Generalized Linear Mixed Models”</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01475.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Rejoinder to “A Note on Type II Error Under Random Effects Misspecification in Generalized Linear Mixed Models”</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Saskia Litière, Ariel Alonso, Geert Molenberghs</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2010-08-19T12:52:48.217797-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2010.01475.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2010.01475.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01475.x</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b> In this rejoinder, we discuss the impact of misspecifying the random effects distribution on inferences obtained from generalized linear mixed models (GLMMs). Special attention is paid to the power of the tests for the fixed-effect parameters. To study this misspecification, researchers often use simulation designs in which several choices for the true underlying random-effects distribution are considered, while the assumed distribution is kept fixed. Neuhaus, McCulloch, and Boylan (2010, <em>Biometrics</em> <b>00</b>, 000–000) argue that a logically correct approach should consist of varying the assumed, fitted distribution, while holding the true fixed. We argue that both simulation designs can bring valuable insights into the impact of the misspecification. Furthermore, using both designs, we illustrate that the power associated with the tests for the fixed-effect parameters in GLMM may be affected by misspecifying the random-effects distribution.</p></div>]]></content:encoded><description>Summary In this rejoinder, we discuss the impact of misspecifying the random effects distribution on inferences obtained from generalized linear mixed models (GLMMs). Special attention is paid to the power of the tests for the fixed-effect parameters. To study this misspecification, researchers often use simulation designs in which several choices for the true underlying random-effects distribution are considered, while the assumed distribution is kept fixed. Neuhaus, McCulloch, and Boylan (2010, Biometrics 00, 000–000) argue that a logically correct approach should consist of varying the assumed, fitted distribution, while holding the true fixed. We argue that both simulation designs can bring valuable insights into the impact of the misspecification. Furthermore, using both designs, we illustrate that the power associated with the tests for the fixed-effect parameters in GLMM may be affected by misspecifying the random-effects distribution.</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01474.x" xmlns="http://purl.org/rss/1.0/"><title>A Note on Type II Error Under Random Effects Misspecification in Generalized Linear Mixed Models</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01474.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Note on Type II Error Under Random Effects Misspecification in Generalized Linear Mixed Models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">John M. Neuhaus, Charles E. McCulloch, Ross Boylan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2010-08-19T12:52:05.049825-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2010.01474.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2010.01474.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2010.01474.x</prism:url><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">no</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p><b><span class="smallCaps">Summary</span></b><a href="#b5" rel="references:#b5">Litière, Alonso, and Molenberghs</a> (2007, <em>Biometrics</em>, <b>63</b>, 1038–1044) presented the results of simulation studies that they claimed showed that misspecification of the shape of the random effects distribution can produce marked increases in Type II error (decreases in power) of tests based on fits of generalized linear mixed models. However, the article contains a logical fallacy that invalidates this claim. We present logically correct simulation studies that demonstrate little increase in Type II error, consistent with the earlier work that shows little effect due to misspecification.</p></div>]]></content:encoded><description>SummaryLitière, Alonso, and Molenberghs (2007, Biometrics, 63, 1038–1044) presented the results of simulation studies that they claimed showed that misspecification of the shape of the random effects distribution can produce marked increases in Type II error (decreases in power) of tests based on fits of generalized linear mixed models. However, the article contains a logical fallacy that invalidates this claim. We present logically correct simulation studies that demonstrate little increase in Type II error, consistent with the earlier work that shows little effect due to misspecification.</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.1824" xmlns="http://purl.org/rss/1.0/"><title>Report of the Editors—2012</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.1824</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Report of the Editors—2012</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-05T12:32:32.64833-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.1824</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.1824</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.1824</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Report of the Editors</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">vii</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">x</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[]]></content:encoded><description/></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01825.x" xmlns="http://purl.org/rss/1.0/"><title>Estimation of False Discovery Rate Using Sequential Permutation p-Values</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01825.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimation of False Discovery Rate Using Sequential Permutation p-Values</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Tim Bancroft, Chuanlong Du, Dan Nettleton</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T17:56:59.542649-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01825.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01825.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01825.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">7</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1825-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>We consider the problem of testing each of <em>m</em> null hypotheses with a sequential permutation procedure in which the number of draws from the permutation distribution of each test statistic is a random variable. Each sequential permutation <em>p</em>-value has a null distribution that is nonuniform on a discrete support. We show how to use a collection of such <em>p</em>-values to estimate the number of true null hypotheses <em>m</em><sub>0</sub> among the <em>m</em> null hypotheses tested and how to estimate the false discovery rate (FDR) associated with <em>p</em>-value significance thresholds. We use real data analyses and simulation studies to evaluate and illustrate the performance of our proposed approach relative to standard, more computationally intensive strategies. We find that our sequential approach produces similar results with far less computational expense in a variety of scenarios.</p></div></div>
]]></content:encoded><description>


We consider the problem of testing each of m null hypotheses with a sequential permutation procedure in which the number of draws from the permutation distribution of each test statistic is a random variable. Each sequential permutation p-value has a null distribution that is nonuniform on a discrete support. We show how to use a collection of such p-values to estimate the number of true null hypotheses m0 among the m null hypotheses tested and how to estimate the false discovery rate (FDR) associated with p-value significance thresholds. We use real data analyses and simulation studies to evaluate and illustrate the performance of our proposed approach relative to standard, more computationally intensive strategies. We find that our sequential approach produces similar results with far less computational expense in a variety of scenarios.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12003" xmlns="http://purl.org/rss/1.0/"><title>Gaussian Process-Based Bayesian Nonparametric Inference of Population Size Trajectories from Gene Genealogies</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12003</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Gaussian Process-Based Bayesian Nonparametric Inference of Population Size Trajectories from Gene Genealogies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Julia A. Palacios, Vladimir N. Minin</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T14:45:31.025247-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12003</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12003</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12003</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">8</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">18</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom12003-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Changes in population size influence genetic diversity of the population and, as a result, leave a signature of these changes in individual genomes in the population. We are interested in the inverse problem of reconstructing past population dynamics from genomic data. We start with a standard framework based on the coalescent, a stochastic process that generates genealogies connecting randomly sampled individuals from the population of interest. These genealogies serve as a glue between the population demographic history and genomic sequences. It turns out that only the times of genealogical lineage coalescences contain information about population size dynamics. Viewing these coalescent times as a point process, estimating population size trajectories is equivalent to estimating a conditional intensity of this point process. Therefore, our inverse problem is similar to estimating an inhomogeneous Poisson process intensity function. We demonstrate how recent advances in Gaussian process-based nonparametric inference for Poisson processes can be extended to Bayesian nonparametric estimation of population size dynamics under the coalescent. We compare our Gaussian process (GP) approach to one of the state-of-the-art Gaussian Markov random field (GMRF) methods for estimating population trajectories. Using simulated data, we demonstrate that our method has better accuracy and precision. Next, we analyze two genealogies reconstructed from real sequences of hepatitis C and human Influenza A viruses. In both cases, we recover more believed aspects of the viral demographic histories than the GMRF approach. We also find that our GP method produces more reasonable uncertainty estimates than the GMRF method.</p></div></div>
]]></content:encoded><description>


Changes in population size influence genetic diversity of the population and, as a result, leave a signature of these changes in individual genomes in the population. We are interested in the inverse problem of reconstructing past population dynamics from genomic data. We start with a standard framework based on the coalescent, a stochastic process that generates genealogies connecting randomly sampled individuals from the population of interest. These genealogies serve as a glue between the population demographic history and genomic sequences. It turns out that only the times of genealogical lineage coalescences contain information about population size dynamics. Viewing these coalescent times as a point process, estimating population size trajectories is equivalent to estimating a conditional intensity of this point process. Therefore, our inverse problem is similar to estimating an inhomogeneous Poisson process intensity function. We demonstrate how recent advances in Gaussian process-based nonparametric inference for Poisson processes can be extended to Bayesian nonparametric estimation of population size dynamics under the coalescent. We compare our Gaussian process (GP) approach to one of the state-of-the-art Gaussian Markov random field (GMRF) methods for estimating population trajectories. Using simulated data, we demonstrate that our method has better accuracy and precision. Next, we analyze two genealogies reconstructed from real sequences of hepatitis C and human Influenza A viruses. In both cases, we recover more believed aspects of the viral demographic histories than the GMRF approach. We also find that our GP method produces more reasonable uncertainty estimates than the GMRF method.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01832.x" xmlns="http://purl.org/rss/1.0/"><title>Hierarchical Factor Models for Large Spatially Misaligned Data: A Low-Rank Predictive Process Approach</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01832.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Hierarchical Factor Models for Large Spatially Misaligned Data: A Low-Rank Predictive Process Approach</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Qian Ren, Sudipto Banerjee</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T13:27:00.334619-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01832.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01832.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01832.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">19</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">30</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1832-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>This article deals with jointly modeling a large number of geographically referenced outcomes observed over a very large number of locations. We seek to capture associations among the variables as well as the strength of spatial association for each variable. In addition, we reckon with the common setting where not all the variables have been observed over all locations, which leads to <em>spatial misalignment</em>. Dimension reduction is needed in two aspects: (i) the length of the vector of outcomes, and (ii) the very large number of spatial locations. Latent variable (factor) models are usually used to address the former, although low-rank spatial processes offer a rich and flexible modeling option for dealing with a large number of locations. We merge these two ideas to propose a class of hierarchical low-rank spatial factor models. Our framework pursues stochastic selection of the latent factors without resorting to complex computational strategies (such as reversible jump algorithms) by utilizing certain identifiability characterizations for the spatial factor model. A Markov chain Monte Carlo algorithm is developed for estimation that also deals with the spatial misalignment problem. We recover the full posterior distribution of the missing values (along with model parameters) in a Bayesian predictive framework. Various additional modeling and implementation issues are discussed as well. We illustrate our methodology with simulation experiments and an environmental data set involving air pollutants in California.</p></div></div>
]]></content:encoded><description>


This article deals with jointly modeling a large number of geographically referenced outcomes observed over a very large number of locations. We seek to capture associations among the variables as well as the strength of spatial association for each variable. In addition, we reckon with the common setting where not all the variables have been observed over all locations, which leads to spatial misalignment. Dimension reduction is needed in two aspects: (i) the length of the vector of outcomes, and (ii) the very large number of spatial locations. Latent variable (factor) models are usually used to address the former, although low-rank spatial processes offer a rich and flexible modeling option for dealing with a large number of locations. We merge these two ideas to propose a class of hierarchical low-rank spatial factor models. Our framework pursues stochastic selection of the latent factors without resorting to complex computational strategies (such as reversible jump algorithms) by utilizing certain identifiability characterizations for the spatial factor model. A Markov chain Monte Carlo algorithm is developed for estimation that also deals with the spatial misalignment problem. We recover the full posterior distribution of the missing values (along with model parameters) in a Bayesian predictive framework. Various additional modeling and implementation issues are discussed as well. We illustrate our methodology with simulation experiments and an environmental data set involving air pollutants in California.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01828.x" xmlns="http://purl.org/rss/1.0/"><title>Wavelet-Based Clustering for Mixed-Effects Functional Models in High Dimension</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01828.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Wavelet-Based Clustering for Mixed-Effects Functional Models in High Dimension</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">M. Giacofci, S. Lambert-Lacroix, G. Marot, F. Picard</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T13:16:25.002266-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01828.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01828.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01828.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">31</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">40</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1828-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>We propose a method for high-dimensional curve clustering in the presence of interindividual variability. Curve clustering has longly been studied especially using splines to account for functional random effects. However, splines are not appropriate when dealing with high-dimensional data and can not be used to model irregular curves such as peak-like data. Our method is based on a wavelet decomposition of the signal for both fixed and random effects. We propose an efficient dimension reduction step based on wavelet thresholding adapted to multiple curves and using an appropriate structure for the random effect variance, we ensure that both fixed and random effects lie in the same functional space even when dealing with irregular functions that belong to Besov spaces. In the wavelet domain our model resumes to a linear mixed-effects model that can be used for a model-based clustering algorithm and for which we develop an EM-algorithm for maximum likelihood estimation. The properties of the overall procedure are validated by an extensive simulation study. Then, we illustrate our method on mass spectrometry data and we propose an original application of functional data analysis on microarray comparative genomic hybridization (CGH) data. Our procedure is available through the R package curvclust which is the first publicly available package that performs curve clustering with random effects in the high dimensional framework (available on the CRAN).</p></div></div>
]]></content:encoded><description>


We propose a method for high-dimensional curve clustering in the presence of interindividual variability. Curve clustering has longly been studied especially using splines to account for functional random effects. However, splines are not appropriate when dealing with high-dimensional data and can not be used to model irregular curves such as peak-like data. Our method is based on a wavelet decomposition of the signal for both fixed and random effects. We propose an efficient dimension reduction step based on wavelet thresholding adapted to multiple curves and using an appropriate structure for the random effect variance, we ensure that both fixed and random effects lie in the same functional space even when dealing with irregular functions that belong to Besov spaces. In the wavelet domain our model resumes to a linear mixed-effects model that can be used for a model-based clustering algorithm and for which we develop an EM-algorithm for maximum likelihood estimation. The properties of the overall procedure are validated by an extensive simulation study. Then, we illustrate our method on mass spectrometry data and we propose an original application of functional data analysis on microarray comparative genomic hybridization (CGH) data. Our procedure is available through the R package curvclust which is the first publicly available package that performs curve clustering with random effects in the high dimensional framework (available on the CRAN).
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01808.x" xmlns="http://purl.org/rss/1.0/"><title>Corrected Confidence Bands for Functional Data Using Principal Components</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01808.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Corrected Confidence Bands for Functional Data Using Principal Components</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">J. Goldsmith, S. Greven, C. Crainiceanu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T21:55:38.759973-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01808.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01808.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01808.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">41</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">51</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1808-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Functional principal components (FPC) analysis is widely used to decompose and express functional observations. Curve estimates implicitly condition on basis functions and other quantities derived from FPC decompositions; however these objects are unknown in practice. In this article, we propose a method for obtaining correct curve estimates by accounting for uncertainty in FPC decompositions. Additionally, pointwise and simultaneous confidence intervals that account for both model- and decomposition-based variability are constructed. Standard mixed model representations of functional expansions are used to construct curve estimates and variances conditional on a specific decomposition. Iterated expectation and variance formulas combine model-based conditional estimates across the distribution of decompositions. A bootstrap procedure is implemented to understand the uncertainty in principal component decomposition quantities. Our method compares favorably to competing approaches in simulation studies that include both densely and sparsely observed functions. We apply our method to sparse observations of CD4 cell counts and to dense white-matter tract profiles. Code for the analyses and simulations is publicly available, and our method is implemented in the R package refund on CRAN.</p></div></div>
]]></content:encoded><description>


Functional principal components (FPC) analysis is widely used to decompose and express functional observations. Curve estimates implicitly condition on basis functions and other quantities derived from FPC decompositions; however these objects are unknown in practice. In this article, we propose a method for obtaining correct curve estimates by accounting for uncertainty in FPC decompositions. Additionally, pointwise and simultaneous confidence intervals that account for both model- and decomposition-based variability are constructed. Standard mixed model representations of functional expansions are used to construct curve estimates and variances conditional on a specific decomposition. Iterated expectation and variance formulas combine model-based conditional estimates across the distribution of decompositions. A bootstrap procedure is implemented to understand the uncertainty in principal component decomposition quantities. Our method compares favorably to competing approaches in simulation studies that include both densely and sparsely observed functions. We apply our method to sparse observations of CD4 cell counts and to dense white-matter tract profiles. Code for the analyses and simulations is publicly available, and our method is implemented in the R package refund on CRAN.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01818.x" xmlns="http://purl.org/rss/1.0/"><title>Latent Subgroup Analysis of a Randomized Clinical Trial through a Semiparametric Accelerated Failure Time Mixture Model</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01818.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Latent Subgroup Analysis of a Randomized Clinical Trial through a Semiparametric Accelerated Failure Time Mixture Model</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">L. Altstein, G. Li</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-05T14:55:27.591396-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01818.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01818.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01818.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">52</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">61</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1818-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>This article studies a semiparametric accelerated failure time mixture model for estimation of a biological treatment effect on a latent subgroup of interest with a time-to-event outcome in randomized clinical trials. Latency is induced because membership is observable in one arm of the trial and unidentified in the other. This method is useful in randomized clinical trials with all-or-none noncompliance when patients in the control arm have no access to active treatment and in, for example, oncology trials when a biopsy used to identify the latent subgroup is performed only on subjects randomized to active treatment. We derive a computational method to estimate model parameters by iterating between an expectation step and a weighted Buckley–James optimization step. The bootstrap method is used for variance estimation, and the performance of our method is corroborated in simulation. We illustrate our method through an analysis of a multicenter selective lymphadenectomy trial for melanoma.</p></div></div>
]]></content:encoded><description>


This article studies a semiparametric accelerated failure time mixture model for estimation of a biological treatment effect on a latent subgroup of interest with a time-to-event outcome in randomized clinical trials. Latency is induced because membership is observable in one arm of the trial and unidentified in the other. This method is useful in randomized clinical trials with all-or-none noncompliance when patients in the control arm have no access to active treatment and in, for example, oncology trials when a biopsy used to identify the latent subgroup is performed only on subjects randomized to active treatment. We derive a computational method to estimate model parameters by iterating between an expectation step and a weighted Buckley–James optimization step. The bootstrap method is used for variance estimation, and the performance of our method is corroborated in simulation. We illustrate our method through an analysis of a multicenter selective lymphadenectomy trial for melanoma.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01822.x" xmlns="http://purl.org/rss/1.0/"><title>A Risk-Adjusted O–E CUSUM with Monitoring Bands for Monitoring Medical Outcomes</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01822.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Risk-Adjusted O–E CUSUM with Monitoring Bands for Monitoring Medical Outcomes</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Rena Jie Sun, John D. Kalbfleisch</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-05T14:43:26.306499-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01822.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01822.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01822.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">62</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">69</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1822-sec-1001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>In order to monitor a medical center's survival outcomes using simple plots, we introduce a risk-adjusted Observed–Expected (O–E) Cumulative SUM (CUSUM) along with monitoring bands as decision criterion.The proposed monitoring bands can be used in place of a more traditional but complicated V-shaped mask or the simultaneous use of two one-sided CUSUMs. The resulting plot is designed to simultaneously monitor for failure time outcomes that are “worse than expected” or “better than expected.” The slopes of the O–E CUSUM provide direct estimates of the relative risk (as compared to a standard or expected failure rate) for the data being monitored. Appropriate rejection regions are obtained by controlling the false alarm rate (type I error) over a period of given length. Simulation studies are conducted to illustrate the performance of the proposed method. A case study is carried out for 58 liver transplant centers. The use of CUSUM methods for quality improvement is stressed.</p></div></div>
]]></content:encoded><description>


In order to monitor a medical center's survival outcomes using simple plots, we introduce a risk-adjusted Observed–Expected (O–E) Cumulative SUM (CUSUM) along with monitoring bands as decision criterion.The proposed monitoring bands can be used in place of a more traditional but complicated V-shaped mask or the simultaneous use of two one-sided CUSUMs. The resulting plot is designed to simultaneously monitor for failure time outcomes that are “worse than expected” or “better than expected.” The slopes of the O–E CUSUM provide direct estimates of the relative risk (as compared to a standard or expected failure rate) for the data being monitored. Appropriate rejection regions are obtained by controlling the false alarm rate (type I error) over a period of given length. Simulation studies are conducted to illustrate the performance of the proposed method. A case study is carried out for 58 liver transplant centers. The use of CUSUM methods for quality improvement is stressed.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01810.x" xmlns="http://purl.org/rss/1.0/"><title>Factor Selection and Structural Identification in the Interaction ANOVA Model</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01810.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Factor Selection and Structural Identification in the Interaction ANOVA Model</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Justin B. Post, Howard D. Bondell</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-01-17T05:06:35.727793-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01810.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01810.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01810.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">70</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">79</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1810-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>When faced with categorical predictors and a continuous response, the objective of an analysis often consists of two tasks: finding which factors are important and determining which levels of the factors differ significantly from one another. Often times, these tasks are done separately using Analysis of Variance (ANOVA) followed by a post hoc hypothesis testing procedure such as Tukey's Honestly Significant Difference test. When interactions between factors are included in the model the collapsing of levels of a factor becomes a more difficult problem. When testing for differences between two levels of a factor, claiming no difference would refer not only to equality of main effects, but also to equality of each interaction involving those levels. This structure between the main effects and interactions in a model is similar to the idea of heredity used in regression models. This article introduces a new method for accomplishing both of the common analysis tasks simultaneously in an interaction model while also adhering to the heredity-type constraint on the model. An appropriate penalization is constructed that encourages levels of factors to collapse and entire factors to be set to zero. It is shown that the procedure has the oracle property implying that asymptotically it performs as well as if the exact structure were known beforehand. We also discuss the application to estimating interactions in the unreplicated case. Simulation studies show the procedure outperforms post hoc hypothesis testing procedures as well as similar methods that do not include a structural constraint. The method is also illustrated using a real data example.</p></div></div>
]]></content:encoded><description>


When faced with categorical predictors and a continuous response, the objective of an analysis often consists of two tasks: finding which factors are important and determining which levels of the factors differ significantly from one another. Often times, these tasks are done separately using Analysis of Variance (ANOVA) followed by a post hoc hypothesis testing procedure such as Tukey's Honestly Significant Difference test. When interactions between factors are included in the model the collapsing of levels of a factor becomes a more difficult problem. When testing for differences between two levels of a factor, claiming no difference would refer not only to equality of main effects, but also to equality of each interaction involving those levels. This structure between the main effects and interactions in a model is similar to the idea of heredity used in regression models. This article introduces a new method for accomplishing both of the common analysis tasks simultaneously in an interaction model while also adhering to the heredity-type constraint on the model. An appropriate penalization is constructed that encourages levels of factors to collapse and entire factors to be set to zero. It is shown that the procedure has the oracle property implying that asymptotically it performs as well as if the exact structure were known beforehand. We also discuss the application to estimating interactions in the unreplicated case. Simulation studies show the procedure outperforms post hoc hypothesis testing procedures as well as similar methods that do not include a structural constraint. The method is also illustrated using a real data example.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01833.x" xmlns="http://purl.org/rss/1.0/"><title>A Regularization Corrected Score Method for Nonlinear Regression Models with Covariate Error</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01833.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Regularization Corrected Score Method for Nonlinear Regression Models with Covariate Error</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">David M. Zucker, Malka Gorfine, Yi Li, Mahlet G. Tadesse, Donna Spiegelman</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T11:35:27.093756-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01833.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01833.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01833.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">80</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">90</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1833-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Many regression analyses involve explanatory variables that are measured with error, and failing to account for this error is well known to lead to biased point and interval estimates of the regression coefficients. We present here a new general method for adjusting for covariate error. Our method consists of an approximate version of the Stefanski–Nakamura corrected score approach, using the method of regularization to obtain an approximate solution of the relevant integral equation. We develop the theory in the setting of classical likelihood models; this setting covers, for example, linear regression, nonlinear regression, logistic regression, and Poisson regression. The method is extremely general in terms of the types of measurement error models covered, and is a functional method in the sense of not involving assumptions on the distribution of the true covariate. We discuss the theoretical properties of the method and present simulation results in the logistic regression setting (univariate and multivariate). For illustration, we apply the method to data from the Harvard Nurses' Health Study concerning the relationship between physical activity and breast cancer mortality in the period following a diagnosis of breast cancer.</p></div></div>
]]></content:encoded><description>


Many regression analyses involve explanatory variables that are measured with error, and failing to account for this error is well known to lead to biased point and interval estimates of the regression coefficients. We present here a new general method for adjusting for covariate error. Our method consists of an approximate version of the Stefanski–Nakamura corrected score approach, using the method of regularization to obtain an approximate solution of the relevant integral equation. We develop the theory in the setting of classical likelihood models; this setting covers, for example, linear regression, nonlinear regression, logistic regression, and Poisson regression. The method is extremely general in terms of the types of measurement error models covered, and is a functional method in the sense of not involving assumptions on the distribution of the true covariate. We discuss the theoretical properties of the method and present simulation results in the logistic regression setting (univariate and multivariate). For illustration, we apply the method to data from the Harvard Nurses' Health Study concerning the relationship between physical activity and breast cancer mortality in the period following a diagnosis of breast cancer.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12001" xmlns="http://purl.org/rss/1.0/"><title>Covariate Adjustment in Estimating the Area Under ROC Curve with Partially Missing Gold Standard</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12001</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Covariate Adjustment in Estimating the Area Under ROC Curve with Partially Missing Gold Standard</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Danping Liu, Xiao-Hua Zhou</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T13:27:05.271814-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12001</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12001</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12001</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">91</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">100</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom12001-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>In ROC analysis, covariate adjustment is advocated when the covariates impact the magnitude or accuracy of the test under study. Meanwhile, for many large scale screening tests, the true condition status may be subject to missingness because it is expensive and/or invasive to ascertain the disease status. The complete-case analysis may end up with a biased inference, also known as “verification bias.” To address the issue of covariate adjustment with verification bias in ROC analysis, we propose several estimators for the area under the covariate-specific and covariate-adjusted ROC curves (AUC<sub><em>x</em></sub> and AAUC). The AUC<sub><em>x</em></sub> is directly modeled in the form of binary regression, and the estimating equations are based on the U statistics. The AAUC is estimated from the weighted average of AUC<sub><em>x</em></sub> over the covariate distribution of the diseased subjects. We employ reweighting and imputation techniques to overcome the verification bias problem. Our proposed estimators are initially derived assuming that the true disease status is missing at random (MAR), and then with some modification, the estimators can be extended to the not missing at random (NMAR) situation. The asymptotic distributions are derived for the proposed estimators. The finite sample performance is evaluated by a series of simulation studies. Our method is applied to a data set in Alzheimer's disease research.</p></div></div>
]]></content:encoded><description>


In ROC analysis, covariate adjustment is advocated when the covariates impact the magnitude or accuracy of the test under study. Meanwhile, for many large scale screening tests, the true condition status may be subject to missingness because it is expensive and/or invasive to ascertain the disease status. The complete-case analysis may end up with a biased inference, also known as “verification bias.” To address the issue of covariate adjustment with verification bias in ROC analysis, we propose several estimators for the area under the covariate-specific and covariate-adjusted ROC curves (AUCx and AAUC). The AUCx is directly modeled in the form of binary regression, and the estimating equations are based on the U statistics. The AAUC is estimated from the weighted average of AUCx over the covariate distribution of the diseased subjects. We employ reweighting and imputation techniques to overcome the verification bias problem. Our proposed estimators are initially derived assuming that the true disease status is missing at random (MAR), and then with some modification, the estimators can be extended to the not missing at random (NMAR) situation. The asymptotic distributions are derived for the proposed estimators. The finite sample performance is evaluated by a series of simulation studies. Our method is applied to a data set in Alzheimer's disease research.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01809.x" xmlns="http://purl.org/rss/1.0/"><title>A Path-Specific SEIR Model for use with General Latent and Infectious Time Distributions</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01809.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Path-Specific SEIR Model for use with General Latent and Infectious Time Distributions</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Aaron T. Porter, Jacob J. Oleson</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-01-16T14:12:24.211771-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01809.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01809.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01809.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">101</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">108</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1809-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Most current Bayesian SEIR (Susceptible, Exposed, Infectious, Removed (or Recovered)) models either use exponentially distributed latent and infectious periods, allow for a single distribution on the latent and infectious period, or make strong assumptions regarding the quantity of information available regarding time distributions, particularly the time spent in the exposed compartment. Many infectious diseases require a more realistic assumption on the latent and infectious periods. In this article, we provide an alternative model allowing general distributions to be utilized for both the exposed and infectious compartments, while avoiding the need for full latent time data. The alternative formulation is a path-specific SEIR (PS SEIR) model that follows individual paths through the exposed and infectious compartments, thereby removing the need for an exponential assumption on the latent and infectious time distributions. We show how the PS SEIR model is a stochastic analog to a general class of deterministic SEIR models. We then demonstrate the improvement of this PS SEIR model over more common population averaged models via simulation results and perform a new analysis of the Iowa mumps epidemic from 2006.</p></div></div>
]]></content:encoded><description>


Most current Bayesian SEIR (Susceptible, Exposed, Infectious, Removed (or Recovered)) models either use exponentially distributed latent and infectious periods, allow for a single distribution on the latent and infectious period, or make strong assumptions regarding the quantity of information available regarding time distributions, particularly the time spent in the exposed compartment. Many infectious diseases require a more realistic assumption on the latent and infectious periods. In this article, we provide an alternative model allowing general distributions to be utilized for both the exposed and infectious compartments, while avoiding the need for full latent time data. The alternative formulation is a path-specific SEIR (PS SEIR) model that follows individual paths through the exposed and infectious compartments, thereby removing the need for an exponential assumption on the latent and infectious time distributions. We show how the PS SEIR model is a stochastic analog to a general class of deterministic SEIR models. We then demonstrate the improvement of this PS SEIR model over more common population averaged models via simulation results and perform a new analysis of the Iowa mumps epidemic from 2006.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01827.x" xmlns="http://purl.org/rss/1.0/"><title>Prevalence Projections of Chronic Diseases and Impact of Public Health Intervention</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01827.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Prevalence Projections of Chronic Diseases and Impact of Public Health Intervention</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Pierre Joly, Célia Touraine, Aurore Georget, Jean-François Dartigues, Daniel Commenges, Hélène Jacqmin-Gadda</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T13:20:21.773449-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01827.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01827.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01827.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">109</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">117</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1827-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>The estimation of future prevalences of chronic diseases is essential for public health policy. Using incidence estimates from cohort data and demographic projections for general mortality and population sizes, we propose a method based on a general illness–death model to make prevalence projections for chronic diseases. In contrast to previously published methods, we account for differences between global mortality and mortality of healthy subjects and compare two assumptions regarding the secular trend for mortality of diseased subjects. Then we develop a methodology to estimate changes in future disease prevalences resulting from prevention campaign to reduce the frequency or the excess risk associated with a risk factor. The methods are applied for estimating dementia prevalence in France between 2010 and 2030.</p></div></div>
]]></content:encoded><description>


The estimation of future prevalences of chronic diseases is essential for public health policy. Using incidence estimates from cohort data and demographic projections for general mortality and population sizes, we propose a method based on a general illness–death model to make prevalence projections for chronic diseases. In contrast to previously published methods, we account for differences between global mortality and mortality of healthy subjects and compare two assumptions regarding the secular trend for mortality of diseased subjects. Then we develop a methodology to estimate changes in future disease prevalences resulting from prevention campaign to reduce the frequency or the excess risk associated with a risk factor. The methods are applied for estimating dementia prevalence in France between 2010 and 2030.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01821.x" xmlns="http://purl.org/rss/1.0/"><title>Impact of Multiple Matched Controls on Design Sensitivity in Observational Studies</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01821.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Impact of Multiple Matched Controls on Design Sensitivity in Observational Studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Paul R. Rosenbaum</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T17:59:11.694405-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01821.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01821.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01821.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">118</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">127</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1821-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>In an observational study, one treated subject may be matched for observed covariates to either one or several untreated controls. The common motivation for using several controls rather than one is to increase the power of a test of no effect under the doubtful assumption that matching for observed covariates suffices to remove bias from nonrandom treatment assignment. Does the choice between one or several matched controls affect the sensitivity of conclusions to violations of this doubtful assumption? With continuous responses, it is known that reducing the heterogeneity of matched pair differences reduces sensitivity to unmeasured biases, but increasing the sample size has a highly circumscribed effect on sensitivity to bias. Is the use of several controls rather than one analogous to a reduction in heterogeneity or to an increase in sample size? The issue is examined for Huber's <em>m</em>-statistics, including the <em>t</em>-test, the examination having three components: an example, asymptotic calculations using design sensitivity, and a simulation. Use of multiple controls with continuous responses yields a nontrivial reduction in sensitivity to unmeasured biases. An example looks at lead and cadmium in the blood of smokers from the 2008 National Health and Nutrition Examination Survey. A by-product of the discussion is a new result giving the design sensitivity for the permutation distribution of <em>m</em>-statistics.</p></div></div>
]]></content:encoded><description>


In an observational study, one treated subject may be matched for observed covariates to either one or several untreated controls. The common motivation for using several controls rather than one is to increase the power of a test of no effect under the doubtful assumption that matching for observed covariates suffices to remove bias from nonrandom treatment assignment. Does the choice between one or several matched controls affect the sensitivity of conclusions to violations of this doubtful assumption? With continuous responses, it is known that reducing the heterogeneity of matched pair differences reduces sensitivity to unmeasured biases, but increasing the sample size has a highly circumscribed effect on sensitivity to bias. Is the use of several controls rather than one analogous to a reduction in heterogeneity or to an increase in sample size? The issue is examined for Huber's m-statistics, including the t-test, the examination having three components: an example, asymptotic calculations using design sensitivity, and a simulation. Use of multiple controls with continuous responses yields a nontrivial reduction in sensitivity to unmeasured biases. An example looks at lead and cadmium in the blood of smokers from the 2008 National Health and Nutrition Examination Survey. A by-product of the discussion is a new result giving the design sensitivity for the permutation distribution of m-statistics.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01795.x" xmlns="http://purl.org/rss/1.0/"><title>A Positive Event Dependence Model for Self-Controlled Case Series with Applications in Postmarketing Surveillance</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01795.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Positive Event Dependence Model for Self-Controlled Case Series with Applications in Postmarketing Surveillance</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Shawn E. Simpson</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T16:38:20.288315-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01795.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01795.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01795.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">128</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">136</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1795-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>A primary objective in the application of postmarketing drug safety surveillance is to ascertain the relationship between time-varying drug exposures and recurrent adverse events (AEs) related to health outcomes. The self-controlled case series (SCCS) method is one approach to analysis in this context. It is based on a conditional Poisson regression model, which assumes that events at different time points are conditionally independent given the covariate process. This requirement is problematic when the occurrence of an event can alter the future event risk. In a clinical setting, for example, patients who have a first myocardial infarction (MI) may be at higher subsequent risk for a second. In this work, we propose the <em>positive dependence self-controlled case series</em> (PD-SCCS) method: a generalization of SCCS that allows the occurrence of an event to increase the future event risk, yet maintains the advantages of the original model by controlling for fixed baseline covariates and relying solely on data from cases. As in the SCCS model, individual-level baseline parameters drop out of the PD-SCCS likelihood. Data sources used for postmarketing surveillance can contain tens of millions of people, so in this situation it is particularly advantageous that PD-SCCS avoids doing a costly estimation of individual parameters. We develop expressions for large sample inference and optimization for PD-SCCS and compare the results of our generalized model with the more restrictive SCCS approach.</p></div></div>
]]></content:encoded><description>


A primary objective in the application of postmarketing drug safety surveillance is to ascertain the relationship between time-varying drug exposures and recurrent adverse events (AEs) related to health outcomes. The self-controlled case series (SCCS) method is one approach to analysis in this context. It is based on a conditional Poisson regression model, which assumes that events at different time points are conditionally independent given the covariate process. This requirement is problematic when the occurrence of an event can alter the future event risk. In a clinical setting, for example, patients who have a first myocardial infarction (MI) may be at higher subsequent risk for a second. In this work, we propose the positive dependence self-controlled case series (PD-SCCS) method: a generalization of SCCS that allows the occurrence of an event to increase the future event risk, yet maintains the advantages of the original model by controlling for fixed baseline covariates and relying solely on data from cases. As in the SCCS model, individual-level baseline parameters drop out of the PD-SCCS likelihood. Data sources used for postmarketing surveillance can contain tens of millions of people, so in this situation it is particularly advantageous that PD-SCCS avoids doing a costly estimation of individual parameters. We develop expressions for large sample inference and optimization for PD-SCCS and compare the results of our generalized model with the more restrictive SCCS approach.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01797.x" xmlns="http://purl.org/rss/1.0/"><title>Testing for Homogeneity of Multivariate Dispersions Using Dissimilarity Measures</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01797.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Testing for Homogeneity of Multivariate Dispersions Using Dissimilarity Measures</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Irène Gijbels, Marek Omelka</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T22:05:30.62415-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01797.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01797.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01797.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">137</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">145</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1797-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Testing homogeneity of dispersions may be of its own scientific interest as well as an important auxiliary step verifying assumptions of a main analysis. The problem is that many biological and ecological data are highly skewed and zero-inflated. Also the number of variables often exceeds the sample size. Thus data analysts often do not rely on parametric assumptions, but use a particular dissimilarity measure to calculate a matrix of pairwise differences. This matrix is then the basis for further statistical inference. Anderson (2006) proposed a distance-based test of homogeneity of multivariate dispersions for a one-way ANOVA design, for which a matrix of pairwise dissimilarities can be taken as an input. The key idea, like in Levene's test, is to replace each observation with its distance to an estimated group center. In this paper we suggest an alternative approach that is based on the means of within-group distances and does not require group centre calculations to obtain the test statistic. We show that this approach can have theoretical as well as practical advantages. A permutation procedure that gives type I error close to the prescribed value even in small samples is described.</p></div></div>
]]></content:encoded><description>


Testing homogeneity of dispersions may be of its own scientific interest as well as an important auxiliary step verifying assumptions of a main analysis. The problem is that many biological and ecological data are highly skewed and zero-inflated. Also the number of variables often exceeds the sample size. Thus data analysts often do not rely on parametric assumptions, but use a particular dissimilarity measure to calculate a matrix of pairwise differences. This matrix is then the basis for further statistical inference. Anderson (2006) proposed a distance-based test of homogeneity of multivariate dispersions for a one-way ANOVA design, for which a matrix of pairwise dissimilarities can be taken as an input. The key idea, like in Levene's test, is to replace each observation with its distance to an estimated group center. In this paper we suggest an alternative approach that is based on the means of within-group distances and does not require group centre calculations to obtain the test statistic. We show that this approach can have theoretical as well as practical advantages. A permutation procedure that gives type I error close to the prescribed value even in small samples is described.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01796.x" xmlns="http://purl.org/rss/1.0/"><title>Estimating Open Population Site Occupancy from Presence–Absence Data Lacking the Robust Design</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01796.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating Open Population Site Occupancy from Presence–Absence Data Lacking the Robust Design</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">D. Dail, L. Madsen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T22:05:26.439954-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01796.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01796.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01796.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">146</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">156</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1796-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Many animal monitoring studies seek to estimate the proportion of a study area occupied by a target population. The study area is divided into spatially distinct sites where the detected presence or absence of the population is recorded, and this is repeated in time for multiple seasons. However, when occupied sites are detected with probability <em>p</em> &lt; 1, the lack of a detection does not imply lack of occupancy. MacKenzie et al. (2003, <em>Ecology</em> <b>84</b>, 2200–2207) developed a multiseason model for estimating seasonal site occupancy (ψ<sub><em>t</em></sub>) while accounting for unknown <em>p</em>. Their model performs well when observations are collected according to the robust design, where multiple sampling occasions occur during each season; the repeated sampling aids in the estimation <em>p</em>. However, their model does not perform as well when the robust design is lacking. In this paper, we propose an alternative likelihood model that yields improved seasonal estimates of <em>p</em> and Ψ<sub><em>t</em></sub> in the absence of the robust design. We construct the marginal likelihood of the observed data by conditioning on, and summing out, the latent number of occupied sites during each season. A simulation study shows that in cases without the robust design, the proposed model estimates <em>p</em> with less bias than the MacKenzie et al. model and hence improves the estimates of Ψ<sub><em>t</em></sub>. We apply both models to a data set consisting of repeated presence–absence observations of American robins (<em>Turdus migratorius</em>) with yearly survey periods. The two models are compared to a third estimator available when the repeated counts (from the same study) are considered, with the proposed model yielding estimates of Ψ<sub><em>t</em></sub> closest to estimates from the point count model.</p></div></div>
]]></content:encoded><description>


Many animal monitoring studies seek to estimate the proportion of a study area occupied by a target population. The study area is divided into spatially distinct sites where the detected presence or absence of the population is recorded, and this is repeated in time for multiple seasons. However, when occupied sites are detected with probability p &lt; 1, the lack of a detection does not imply lack of occupancy. MacKenzie et al. (2003, Ecology 84, 2200–2207) developed a multiseason model for estimating seasonal site occupancy (ψt) while accounting for unknown p. Their model performs well when observations are collected according to the robust design, where multiple sampling occasions occur during each season; the repeated sampling aids in the estimation p. However, their model does not perform as well when the robust design is lacking. In this paper, we propose an alternative likelihood model that yields improved seasonal estimates of p and Ψt in the absence of the robust design. We construct the marginal likelihood of the observed data by conditioning on, and summing out, the latent number of occupied sites during each season. A simulation study shows that in cases without the robust design, the proposed model estimates p with less bias than the MacKenzie et al. model and hence improves the estimates of Ψt. We apply both models to a data set consisting of repeated presence–absence observations of American robins (Turdus migratorius) with yearly survey periods. The two models are compared to a third estimator available when the repeated counts (from the same study) are considered, with the proposed model yielding estimates of Ψt closest to estimates from the point count model.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01806.x" xmlns="http://purl.org/rss/1.0/"><title>Bayesian Hypothesis Testing in Two-Arm Trials with Dichotomous Outcomes</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01806.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian Hypothesis Testing in Two-Arm Trials with Dichotomous Outcomes</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Boris G. Zaslavsky</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T22:06:53.994322-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01806.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01806.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01806.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">157</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">163</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1806-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>This article is motivated by an interest in comparing inferences made when using a Bayesian or frequentist statistical approach. The article addresses the study of one-sided superiority and noninferiority Bayesian tests. These tests are stated in terms of the posterior probability that the null hypothesis is true for the binomial distribution and in terms of one-sided credible limits. We restrict our considerations to conjugate beta priors with integer parameters. Under this assumption, the posterior probabilities of tested hypotheses can be transformed into the frequentist probabilities of Bernoulli trials with an adjusted number of events and population sizes. The method resembles a standard frequentist problem formulation. By using an appropriate choice of prior parameters, the posterior probabilities of the null hypothesis can be made smaller or larger than the <em>p</em>-values of frequentist tests.</p></div></div>
]]></content:encoded><description>


This article is motivated by an interest in comparing inferences made when using a Bayesian or frequentist statistical approach. The article addresses the study of one-sided superiority and noninferiority Bayesian tests. These tests are stated in terms of the posterior probability that the null hypothesis is true for the binomial distribution and in terms of one-sided credible limits. We restrict our considerations to conjugate beta priors with integer parameters. Under this assumption, the posterior probabilities of tested hypotheses can be transformed into the frequentist probabilities of Bernoulli trials with an adjusted number of events and population sizes. The method resembles a standard frequentist problem formulation. By using an appropriate choice of prior parameters, the posterior probabilities of the null hypothesis can be made smaller or larger than the p-values of frequentist tests.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12004" xmlns="http://purl.org/rss/1.0/"><title>A Novel Bayesian Semiparametric Algorithm for Inferring Population Structure and Adjusting for Case-Control Association Tests</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12004</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Novel Bayesian Semiparametric Algorithm for Inferring Population Structure and Adjusting for Case-Control Association Tests</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Arunabha Majumdar, Sourabh Bhattacharya, Analabha Basu, Saurabh Ghosh</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-21T12:36:36.308672-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12004</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12004</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12004</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">164</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">173</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom12004-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>While the population-based case-control approach is the popular study design for association mapping of complex genetic traits because of ease of data collection and statistical analyses, it suffers from the inherent problem of population stratification. There have been methodological developments for adjusting these studies for population substructure, but efficient estimation of the number of subpopulations (<em>K</em>), which has evolutionary significance, remains a statistical challenge. In this article, we propose a Bayesian semiparametric approach to estimate population substructure under the assumption that <em>K</em> is random. Using extensive simulations, we find that our proposed method is not only computationally much faster than an existing Bayesian approach <em>Structure</em>, but also estimates the number of subpopulations more accurately, and thus, yields more power in detecting association in case-control studies.</p></div></div>
]]></content:encoded><description>


While the population-based case-control approach is the popular study design for association mapping of complex genetic traits because of ease of data collection and statistical analyses, it suffers from the inherent problem of population stratification. There have been methodological developments for adjusting these studies for population substructure, but efficient estimation of the number of subpopulations (K), which has evolutionary significance, remains a statistical challenge. In this article, we propose a Bayesian semiparametric approach to estimate population substructure under the assumption that K is random. Using extensive simulations, we find that our proposed method is not only computationally much faster than an existing Bayesian approach Structure, but also estimates the number of subpopulations more accurately, and thus, yields more power in detecting association in case-control studies.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01817.x" xmlns="http://purl.org/rss/1.0/"><title>Semiparametric Bayesian Inference for Phage Display Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01817.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Semiparametric Bayesian Inference for Phage Display Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Luis G. León-Novelo, Peter Müller, Wadih Arap, Mikhail Kolonin, Jessica Sun, Renata Pasqualini, Kim-Anh Do</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-01-22T17:25:47.04062-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01817.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01817.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01817.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">174</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">183</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1817-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>We discuss inference for a human phage display experiment with three stages. The data are tripeptide counts by tissue and stage. The primary aim of the experiment is to identify ligands that bind with high affinity to a given tissue. We formalize the research question as inference about the monotonicity of mean counts over stages. The inference goal is then to identify a list of peptide–tissue pairs with significant increase over stages. We use a semiparametric Dirichlet process mixture of Poisson model. The posterior distribution under this model allows the desired inference about the monotonicity of mean counts. However, the desired inference summary as a list of peptide–tissue pairs with significant increase involves a massive multiplicity problem. We consider two alternative approaches to address this multiplicity issue. First we propose an approach based on the control of the posterior expected false discovery rate. We notice that the implied solution ignores the relative size of the increase. This motivates a second approach based on a utility function that includes explicit weights for the size of the increase.</p></div></div>
]]></content:encoded><description>


We discuss inference for a human phage display experiment with three stages. The data are tripeptide counts by tissue and stage. The primary aim of the experiment is to identify ligands that bind with high affinity to a given tissue. We formalize the research question as inference about the monotonicity of mean counts over stages. The inference goal is then to identify a list of peptide–tissue pairs with significant increase over stages. We use a semiparametric Dirichlet process mixture of Poisson model. The posterior distribution under this model allows the desired inference about the monotonicity of mean counts. However, the desired inference summary as a list of peptide–tissue pairs with significant increase involves a massive multiplicity problem. We consider two alternative approaches to address this multiplicity issue. First we propose an approach based on the control of the posterior expected false discovery rate. We notice that the implied solution ignores the relative size of the increase. This motivates a second approach based on a utility function that includes explicit weights for the size of the increase.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01819.x" xmlns="http://purl.org/rss/1.0/"><title>A Wavelet-Based Bayesian Approach to Regression Models with Long Memory Errors and Its Application to fMRI Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01819.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Wavelet-Based Bayesian Approach to Regression Models with Long Memory Errors and Its Application to fMRI Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jaesik Jeong, Marina Vannucci, Kyungduk Ko</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T13:31:18.527383-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01819.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01819.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01819.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">184</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">196</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1819-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>This article considers linear regression models with long memory errors. These models have been proven useful for application in many areas, such as medical imaging, signal processing, and econometrics. Wavelets, being self-similar, have a strong connection to long memory data. Here we employ discrete wavelet transforms as whitening filters to simplify the dense variance–covariance matrix of the data. We then adopt a Bayesian approach for the estimation of the model parameters. Our inferential procedure uses exact wavelet coefficients variances and leads to accurate estimates of the model parameters. We explore performances on simulated data and present an application to an fMRI data set. In the application we produce posterior probability maps (PPMs) that aid interpretation by identifying voxels that are likely activated with a given confidence.</p></div></div>
]]></content:encoded><description>


This article considers linear regression models with long memory errors. These models have been proven useful for application in many areas, such as medical imaging, signal processing, and econometrics. Wavelets, being self-similar, have a strong connection to long memory data. Here we employ discrete wavelet transforms as whitening filters to simplify the dense variance–covariance matrix of the data. We then adopt a Bayesian approach for the estimation of the model parameters. Our inferential procedure uses exact wavelet coefficients variances and leads to accurate estimates of the model parameters. We explore performances on simulated data and present an application to an fMRI data set. In the application we produce posterior probability maps (PPMs) that aid interpretation by identifying voxels that are likely activated with a given confidence.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01812.x" xmlns="http://purl.org/rss/1.0/"><title>Exploration of Lagged Associations using Longitudinal Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01812.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Exploration of Lagged Associations using Longitudinal Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Patrick J. Heagerty, Bryan A. Comstock</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-01-22T17:25:51.732336-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01812.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01812.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01812.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">197</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">205</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1812-sec-2002" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Several statistical approaches for the analysis of longitudinal data require that models be correctly specified for the association between a current outcome and the full history of past outcomes and time-dependent exposures. It is empirically challenging to determine the specific aspects of the outcome and/or exposure history that are predictive of a current outcome because the potential number of variables representing the history can be quite large. The purpose of this article is to outline statistical methods that can characterize lagged effects and to provide a structured approach for data analysis with the goal of appropriate model development. One of the main contributions of the article is to emphasize the possibility that in practice transition models may frequently require more than simple additive and linear models for the predictors representing the history of the outcome and covariate processes. We illustrate the concepts using an example from anemia treatment for dialysis patients and show how linear models can be specified with flexible dependence on exposure and/or outcome histories.</p></div></div>
]]></content:encoded><description>


Several statistical approaches for the analysis of longitudinal data require that models be correctly specified for the association between a current outcome and the full history of past outcomes and time-dependent exposures. It is empirically challenging to determine the specific aspects of the outcome and/or exposure history that are predictive of a current outcome because the potential number of variables representing the history can be quite large. The purpose of this article is to outline statistical methods that can characterize lagged effects and to provide a structured approach for data analysis with the goal of appropriate model development. One of the main contributions of the article is to emphasize the possibility that in practice transition models may frequently require more than simple additive and linear models for the predictors representing the history of the outcome and covariate processes. We illustrate the concepts using an example from anemia treatment for dialysis patients and show how linear models can be specified with flexible dependence on exposure and/or outcome histories.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01823.x" xmlns="http://purl.org/rss/1.0/"><title>Real-Time Individual Predictions of Prostate Cancer Recurrence Using Joint Models</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01823.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Real-Time Individual Predictions of Prostate Cancer Recurrence Using Joint Models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jeremy M. G. Taylor, Yongseok Park, Donna P. Ankerst, Cecile Proust-Lima, Scott Williams, Larry Kestin, Kyoungwha Bae, Tom Pickles, Howard Sandler</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T13:34:37.718572-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01823.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01823.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01823.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">206</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">213</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1823-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Patients who were previously treated for prostate cancer with radiation therapy are monitored at regular intervals using a laboratory test called Prostate Specific Antigen (PSA). If the value of the PSA test starts to rise, this is an indication that the prostate cancer is more likely to recur, and the patient may wish to initiate new treatments. Such patients could be helped in making medical decisions by an accurate estimate of the probability of recurrence of the cancer in the next few years. In this article, we describe the methodology for giving the probability of recurrence for a new patient, as implemented on a web-based calculator. The methods use a joint longitudinal survival model. The model is developed on a training dataset of 2386 patients and tested on a dataset of 846 patients. Bayesian estimation methods are used with one Markov chain Monte Carlo (MCMC) algorithm developed for estimation of the parameters from the training dataset and a second quick MCMC developed for prediction of the risk of recurrence that uses the longitudinal PSA measures from a new patient.</p></div></div>
]]></content:encoded><description>


Patients who were previously treated for prostate cancer with radiation therapy are monitored at regular intervals using a laboratory test called Prostate Specific Antigen (PSA). If the value of the PSA test starts to rise, this is an indication that the prostate cancer is more likely to recur, and the patient may wish to initiate new treatments. Such patients could be helped in making medical decisions by an accurate estimate of the probability of recurrence of the cancer in the next few years. In this article, we describe the methodology for giving the probability of recurrence for a new patient, as implemented on a web-based calculator. The methods use a joint longitudinal survival model. The model is developed on a training dataset of 2386 patients and tested on a dataset of 846 patients. Bayesian estimation methods are used with one Markov chain Monte Carlo (MCMC) algorithm developed for estimation of the parameters from the training dataset and a second quick MCMC developed for prediction of the risk of recurrence that uses the longitudinal PSA measures from a new patient.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01807.x" xmlns="http://purl.org/rss/1.0/"><title>Modeling Seroadaptation and Sexual Behavior Among HIV+ Study Participants with a Simultaneously Multilevel and Multivariate Longitudinal Count Model</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01807.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Modeling Seroadaptation and Sexual Behavior Among HIV+ Study Participants with a Simultaneously Multilevel and Multivariate Longitudinal Count Model</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yuda Zhu, Robert E. Weiss</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-24T21:55:31.576106-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01807.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01807.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01807.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">214</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">224</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1807-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Longitudinal behavioral intervention trials to reduce HIV transmission risk collect complex multilevel and multivariate data longitudinally for each subject with important correlation structures across time, level, and variables. Accurately assessing the effects of these trials are critical for determining which interventions are effective. Both numbers of partners and numbers of sex acts with each partner are reported at each time point. Sex acts with each partner are further differentiated into protected and unprotected acts with correspondingly differing risks of HIV/STD transmission. These trials generally also have eligibility criteria limiting enrollment to participants with some minimal level of risky sexual behavior tied directly to the outcome of interest. The combination of these factors makes it difficult to quantify sexual behaviors and the effects of intervention. We propose a multivariate multilevel count model that simultaneously models the number of partners, acts within partners, and accounts for recruitment eligibility. Our methods are useful in the evaluation of intervention trials and provide a more accurate and complete model for sexual behavior. We illustrate the contributions of our model by examining seroadaptive behavior defined as risk reducing behavior that depends on the serostatus of the partner. Several forms of seroadaptive risk reducing behavior are quantified and distinguished from nonseroadaptive risk reducing behavior.</p></div></div>
]]></content:encoded><description>


Longitudinal behavioral intervention trials to reduce HIV transmission risk collect complex multilevel and multivariate data longitudinally for each subject with important correlation structures across time, level, and variables. Accurately assessing the effects of these trials are critical for determining which interventions are effective. Both numbers of partners and numbers of sex acts with each partner are reported at each time point. Sex acts with each partner are further differentiated into protected and unprotected acts with correspondingly differing risks of HIV/STD transmission. These trials generally also have eligibility criteria limiting enrollment to participants with some minimal level of risky sexual behavior tied directly to the outcome of interest. The combination of these factors makes it difficult to quantify sexual behaviors and the effects of intervention. We propose a multivariate multilevel count model that simultaneously models the number of partners, acts within partners, and accounts for recruitment eligibility. Our methods are useful in the evaluation of intervention trials and provide a more accurate and complete model for sexual behavior. We illustrate the contributions of our model by examining seroadaptive behavior defined as risk reducing behavior that depends on the serostatus of the partner. Several forms of seroadaptive risk reducing behavior are quantified and distinguished from nonseroadaptive risk reducing behavior.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12002" xmlns="http://purl.org/rss/1.0/"><title>Estimating Time to Disease Progression Comparing Transition Models and Survival Methods—An Analysis of Multiple Sclerosis Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12002</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating Time to Disease Progression Comparing Transition Models and Survival Methods—An Analysis of Multiple Sclerosis Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Micha Mandel, Francois Mercier, Benjamin Eckert, Peter Chin, Rebecca A. Betensky</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-14T14:45:23.165124-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12002</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12002</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12002</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">225</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">234</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom12002-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>This article reports an analysis that aims to quantify the effect of fingolimod, an oral treatment for relapsing remitting multiple sclerosis (MS), on disability progression. The standard approach utilizes survival analysis methods, which may be problematic for MS studies that assess disability at only a few time points and include as a cardinal feature both relapses and remissions. Instead, a Markov transition model, originally developed in the framework of longitudinal data, is fit, and its special probabilistic properties are used to estimate survival curves for time to disability progression. The transition approach models the whole disability process and uses all available transition data for inference, while survival methods concentrate on a single event of interest and use only time to event data. This article compares the transition model approach to survival analysis methods, and discusses the differences in the interpretations of the estimated parameters. It applies both models to data obtained from two phase 3 clinical trials and finds that both yield positive effects for the new treatment compared to placebo, and provide similar estimates for the probability of disability progression over time. The transition model enables calculation of covariate-specific transition matrices that describe the short-term effect of treatment and other covariates on the disability process.</p></div></div>
]]></content:encoded><description>


This article reports an analysis that aims to quantify the effect of fingolimod, an oral treatment for relapsing remitting multiple sclerosis (MS), on disability progression. The standard approach utilizes survival analysis methods, which may be problematic for MS studies that assess disability at only a few time points and include as a cardinal feature both relapses and remissions. Instead, a Markov transition model, originally developed in the framework of longitudinal data, is fit, and its special probabilistic properties are used to estimate survival curves for time to disability progression. The transition approach models the whole disability process and uses all available transition data for inference, while survival methods concentrate on a single event of interest and use only time to event data. This article compares the transition model approach to survival analysis methods, and discusses the differences in the interpretations of the estimated parameters. It applies both models to data obtained from two phase 3 clinical trials and finds that both yield positive effects for the new treatment compared to placebo, and provide similar estimates for the probability of disability progression over time. The transition model enables calculation of covariate-specific transition matrices that describe the short-term effect of treatment and other covariates on the disability process.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01826.x" xmlns="http://purl.org/rss/1.0/"><title>Estimating Strain-Specific and Overall Efficacy of Polyvalent Vaccines Against Recurrent Pathogens From a Cross-Sectional Study</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01826.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating Strain-Specific and Overall Efficacy of Polyvalent Vaccines Against Recurrent Pathogens From a Cross-Sectional Study</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Kari Auranen, Hanna Rinta-Kokko, M. Elizabeth Halloran</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T16:50:11.107953-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01826.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01826.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01826.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">235</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">244</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1826-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Evaluating vaccine efficacy for protection against colonization with bacterial pathogens is an area of growing interest. Colonization of the nasopharynx is an asymptomatic carrier state responsible for person-to-person transmission. It differs from most clinical outcomes in that it is common, recurrent, and observed only in its prevalent state. To estimate rates of acquisition and clearance of colonization requires repeated active sampling of the same individuals over time, an expensive and invasive undertaking. Motivated by feasibility constraints in efficacy trials with colonization endpoints, investigators have been estimating vaccine efficacy from cross-sectional studies without principled methods. We present two examples of vaccine studies estimating vaccine efficacy from cross-sectional data on nasopharyngeal colonization by <em>Streptococcus pneumoniae</em> (pneumococcus). This study presents a framework for defining and estimating strain-specific and overall vaccine efficacy for susceptibility to acquisition of colonization (<img alt="inline equation image" src="http://onlinelibrary.wiley.com/store/10.1111/j.1541-0420.2012.01826.x/asset/equation/biom1826-gra-0001.gif?v=1&amp;s=ec7ecfd2222772dd32edf8cd65d25777a80f8193" class="inlineGraphic"/>) when there is a large number of strains with mutual interactions and recurrent dynamics of colonization. We develop estimators based on one observation of the current status per study subject, evaluate their robustness, and re-analyze the two vaccine trials. Methodologically, the proposed estimators are closely related to case–control studies with prevalent cases, with appropriate consideration of the at-risk time in choosing the controls.</p></div></div>
]]></content:encoded><description>


Evaluating vaccine efficacy for protection against colonization with bacterial pathogens is an area of growing interest. Colonization of the nasopharynx is an asymptomatic carrier state responsible for person-to-person transmission. It differs from most clinical outcomes in that it is common, recurrent, and observed only in its prevalent state. To estimate rates of acquisition and clearance of colonization requires repeated active sampling of the same individuals over time, an expensive and invasive undertaking. Motivated by feasibility constraints in efficacy trials with colonization endpoints, investigators have been estimating vaccine efficacy from cross-sectional studies without principled methods. We present two examples of vaccine studies estimating vaccine efficacy from cross-sectional data on nasopharyngeal colonization by Streptococcus pneumoniae (pneumococcus). This study presents a framework for defining and estimating strain-specific and overall vaccine efficacy for susceptibility to acquisition of colonization () when there is a large number of strains with mutual interactions and recurrent dynamics of colonization. We develop estimators based on one observation of the current status per study subject, evaluate their robustness, and re-analyze the two vaccine trials. Methodologically, the proposed estimators are closely related to case–control studies with prevalent cases, with appropriate consideration of the at-risk time in choosing the controls.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01831.x" xmlns="http://purl.org/rss/1.0/"><title>A Semiparametric Censoring Bias Model for Estimating the Cumulative Risk of a False-Positive Screening Test Under Dependent Censoring</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01831.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Semiparametric Censoring Bias Model for Estimating the Cumulative Risk of a False-Positive Screening Test Under Dependent Censoring</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Rebecca A. Hubbard, Diana L. Miglioretti</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-05T15:12:26.484582-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01831.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01831.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01831.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">245</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">253</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1831-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>False-positive test results are among the most common harms of screening tests and may lead to more invasive and expensive diagnostic testing procedures. Estimating the cumulative risk of a false-positive screening test result after repeat screening rounds is, therefore, important for evaluating potential screening regimens. Existing estimators of the cumulative false-positive risk are limited by strong assumptions about censoring mechanisms and parametric assumptions about variation in risk across screening rounds. To address these limitations, we propose a semiparametric censoring bias model for cumulative false-positive risk that allows for dependent censoring without specifying a fixed functional form for variation in risk across screening rounds. Simulation studies demonstrated that the censoring bias model performs similarly to existing models under independent censoring and can largely eliminate bias under dependent censoring. We used the existing and newly proposed models to estimate the cumulative false-positive risk and variation in risk as a function of baseline age and family history of breast cancer after 10 years of annual screening mammography using data from the Breast Cancer Surveillance Consortium. Ignoring potential dependent censoring in this context leads to underestimation of the cumulative risk of false-positive results. Models that provide accurate estimates under dependent censoring are critical for providing appropriate information for evaluating screening tests.</p></div></div>
]]></content:encoded><description>


False-positive test results are among the most common harms of screening tests and may lead to more invasive and expensive diagnostic testing procedures. Estimating the cumulative risk of a false-positive screening test result after repeat screening rounds is, therefore, important for evaluating potential screening regimens. Existing estimators of the cumulative false-positive risk are limited by strong assumptions about censoring mechanisms and parametric assumptions about variation in risk across screening rounds. To address these limitations, we propose a semiparametric censoring bias model for cumulative false-positive risk that allows for dependent censoring without specifying a fixed functional form for variation in risk across screening rounds. Simulation studies demonstrated that the censoring bias model performs similarly to existing models under independent censoring and can largely eliminate bias under dependent censoring. We used the existing and newly proposed models to estimate the cumulative false-positive risk and variation in risk as a function of baseline age and family history of breast cancer after 10 years of annual screening mammography using data from the Breast Cancer Surveillance Consortium. Ignoring potential dependent censoring in this context leads to underestimation of the cumulative risk of false-positive results. Models that provide accurate estimates under dependent censoring are critical for providing appropriate information for evaluating screening tests.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01829.x" xmlns="http://purl.org/rss/1.0/"><title>An Application of Targeted Maximum Likelihood Estimation to the Meta-Analysis of Safety Data</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01829.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">An Application of Targeted Maximum Likelihood Estimation to the Meta-Analysis of Safety Data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Susan Gruber, Mark J. van der Laan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T17:54:25.211384-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01829.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01829.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01829.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">254</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">262</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1829-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Safety analysis to estimate the effect of a treatment on an adverse event poses a challenging statistical problem even in randomized controlled trials because these events are typically rare, so studies originally powered for efficacy are underpowered for safety outcomes. A meta-analysis of data pooled across multiple studies may increase power, but missingness in the outcome or failed randomization can introduce bias. This article illustrates how targeted maximum likelihood estimation (TMLE) can be applied in a meta-analysis to reduce bias in causal effect estimates, and compares performance with other estimators in the literature. A simulation study in which missingness in the outcome is at random or completely at random highlights the differences in estimators with respect to the potential gains in bias and efficiency. Risk difference, relative risk, and odds ratio of the effect of treatment on 30-daymortality are estimated from data from eight randomized controlled trials. When an outcome event is rare there may be little opportunity to improve efficiency, and associations between covariates and the outcome may be hard to detect. TMLE attempts to exploit the available information to either meet or exceed the performance of a less sophisticated estimator.</p></div></div>
]]></content:encoded><description>


Safety analysis to estimate the effect of a treatment on an adverse event poses a challenging statistical problem even in randomized controlled trials because these events are typically rare, so studies originally powered for efficacy are underpowered for safety outcomes. A meta-analysis of data pooled across multiple studies may increase power, but missingness in the outcome or failed randomization can introduce bias. This article illustrates how targeted maximum likelihood estimation (TMLE) can be applied in a meta-analysis to reduce bias in causal effect estimates, and compares performance with other estimators in the literature. A simulation study in which missingness in the outcome is at random or completely at random highlights the differences in estimators with respect to the potential gains in bias and efficiency. Risk difference, relative risk, and odds ratio of the effect of treatment on 30-daymortality are estimated from data from eight randomized controlled trials. When an outcome event is rare there may be little opportunity to improve efficiency, and associations between covariates and the outcome may be hard to detect. TMLE attempts to exploit the available information to either meet or exceed the performance of a less sophisticated estimator.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01830.x" xmlns="http://purl.org/rss/1.0/"><title>Model Feedback in Bayesian Propensity Score Estimation</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01830.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Model Feedback in Bayesian Propensity Score Estimation</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Corwin M. Zigler, Krista Watts, Robert W. Yeh, Yun Wang, Brent A. Coull, Francesca Dominici</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T16:34:55.575496-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01830.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01830.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01830.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">263</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">273</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1830-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Methods based on the propensity score comprise one set of valuable tools for comparative effectiveness research and for estimating causal effects more generally. These methods typically consist of two distinct stages: (1) a propensity score stage where a model is fit to predict the propensity to receive treatment (the propensity score), and (2) an outcome stage where responses are compared in treated and untreated units having similar values of the estimated propensity score. Traditional techniques conduct estimation in these two stages separately; estimates from the first stage are treated as fixed and known for use in the second stage. Bayesian methods have natural appeal in these settings because separate likelihoods for the two stages can be combined into a single joint likelihood, with estimation of the two stages carried out simultaneously. One key feature of joint estimation in this context is “feedback” between the outcome stage and the propensity score stage, meaning that quantities in a model for the outcome contribute information to posterior distributions of quantities in the model for the propensity score. We provide a rigorous assessment of Bayesian propensity score estimation to show that model feedback can produce poor estimates of causal effects absent strategies that augment propensity score adjustment with adjustment for individual covariates. We illustrate this phenomenon with a simulation study and with a comparative effectiveness investigation of carotid artery stenting versus carotid endarterectomy among 123,286 Medicare beneficiaries hospitlized for stroke in 2006 and 2007.</p></div></div>
]]></content:encoded><description>


Methods based on the propensity score comprise one set of valuable tools for comparative effectiveness research and for estimating causal effects more generally. These methods typically consist of two distinct stages: (1) a propensity score stage where a model is fit to predict the propensity to receive treatment (the propensity score), and (2) an outcome stage where responses are compared in treated and untreated units having similar values of the estimated propensity score. Traditional techniques conduct estimation in these two stages separately; estimates from the first stage are treated as fixed and known for use in the second stage. Bayesian methods have natural appeal in these settings because separate likelihoods for the two stages can be combined into a single joint likelihood, with estimation of the two stages carried out simultaneously. One key feature of joint estimation in this context is “feedback” between the outcome stage and the propensity score stage, meaning that quantities in a model for the outcome contribute information to posterior distributions of quantities in the model for the propensity score. We provide a rigorous assessment of Bayesian propensity score estimation to show that model feedback can produce poor estimates of causal effects absent strategies that augment propensity score adjustment with adjustment for individual covariates. We illustrate this phenomenon with a simulation study and with a comparative effectiveness investigation of carotid artery stenting versus carotid endarterectomy among 123,286 Medicare beneficiaries hospitlized for stroke in 2006 and 2007.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01824.x" xmlns="http://purl.org/rss/1.0/"><title>Equivalence of MAXENT and Poisson Point Process Models for Species Distribution Modeling in Ecology</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01824.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Equivalence of MAXENT and Poisson Point Process Models for Species Distribution Modeling in Ecology</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ian W. Renner, David I. Warton</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-02-04T17:54:20.032438-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01824.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01824.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01824.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Original Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">274</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">281</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1824-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>Modeling the spatial distribution of a species is a fundamental problem in ecology. A number of modeling methods have been developed, an extremely popular one being MAXENT, a maximum entropy modeling approach. In this article, we show that MAXENT is equivalent to a Poisson regression model and hence is related to a Poisson point process model, differing only in the intercept term, which is scale-dependent in MAXENT. We illustrate a number of improvements to MAXENT that follow from these relations. In particular, a point process model approach facilitates methods for choosing the appropriate spatial resolution, assessing model adequacy, and choosing the LASSO penalty parameter, all currently unavailable to MAXENT. The equivalence result represents a significant step in the unification of the species distribution modeling literature.</p></div></div>
]]></content:encoded><description>


Modeling the spatial distribution of a species is a fundamental problem in ecology. A number of modeling methods have been developed, an extremely popular one being MAXENT, a maximum entropy modeling approach. In this article, we show that MAXENT is equivalent to a Poisson regression model and hence is related to a Poisson point process model, differing only in the intercept term, which is scale-dependent in MAXENT. We illustrate a number of improvements to MAXENT that follow from these relations. In particular, a point process model approach facilitates methods for choosing the appropriate spatial resolution, assessing model adequacy, and choosing the LASSO penalty parameter, all currently unavailable to MAXENT. The equivalence result represents a significant step in the unification of the species distribution modeling literature.

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01798.x" xmlns="http://purl.org/rss/1.0/"><title>A Note on Using Regression Models to Analyze Randomized Trials: Asymptotically Valid Hypothesis Tests Despite Incorrectly Specified Models</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01798.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Note on Using Regression Models to Analyze Randomized Trials: Asymptotically Valid Hypothesis Tests Despite Incorrectly Specified Models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jane Paik Kim</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-28T11:20:40.517356-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01798.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01798.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01798.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Reader Reaction</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">282</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">289</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Summary</h3>
<div class="section" id="biom1798-sec-0001" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>In the context of randomized trials, Rosenblum and van der Laan (2009, <em>Biometrics</em> <b>63</b>, 937–945) considered the null hypothesis of no treatment effect on the mean outcome within strata of baseline variables. They showed that hypothesis tests based on linear regression models and generalized linear regression models are guaranteed to have asymptotically correct Type I error regardless of the actual data generating distribution, assuming the treatment assignment is independent of covariates. We consider another important outcome in randomized trials, the time from randomization until failure, and the null hypothesis of no treatment effect on the survivor function conditional on a set of baseline variables. By a direct application of arguments in Rosenblum and van der Laan (2009), we show that hypothesis tests based on multiplicative hazards models with an exponential link, i.e., proportional hazards models, and multiplicative hazards models with linear link functions where the baseline hazard is parameterized, are asymptotically valid under model misspecification provided that the censoring distribution is independent of the treatment assignment given the covariates. In the case of the Cox model and linear link model with unspecified baseline hazard function, the arguments in Rosenblum and van der Laan (2009) cannot be applied to show the robustness of a misspecified model. Instead, we adopt an approach used in previous literature (Struthers and Kalbfleisch, 1986, <em>Biometrika</em> <b>73</b>, 363–369) to show that hypothesis tests based on these models, including models with interaction terms, have correct type I error.</p></div></div>
]]></content:encoded><description>


In the context of randomized trials, Rosenblum and van der Laan (2009, Biometrics 63, 937–945) considered the null hypothesis of no treatment effect on the mean outcome within strata of baseline variables. They showed that hypothesis tests based on linear regression models and generalized linear regression models are guaranteed to have asymptotically correct Type I error regardless of the actual data generating distribution, assuming the treatment assignment is independent of covariates. We consider another important outcome in randomized trials, the time from randomization until failure, and the null hypothesis of no treatment effect on the survivor function conditional on a set of baseline variables. By a direct application of arguments in Rosenblum and van der Laan (2009), we show that hypothesis tests based on multiplicative hazards models with an exponential link, i.e., proportional hazards models, and multiplicative hazards models with linear link functions where the baseline hazard is parameterized, are asymptotically valid under model misspecification provided that the censoring distribution is independent of the treatment assignment given the covariates. In the case of the Cox model and linear link model with unspecified baseline hazard function, the arguments in Rosenblum and van der Laan (2009) cannot be applied to show the robustness of a misspecified model. Instead, we adopt an approach used in previous literature (Struthers and Kalbfleisch, 1986, Biometrika 73, 363–369) to show that hypothesis tests based on these models, including models with interaction terms, have correct type I error.
</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01799.x" xmlns="http://purl.org/rss/1.0/"><title>Rejoinder to “A Note on Using Regression Models to Analyze Randomized Trials: Asymptotically Valid Hypothesis Tests Despite Incorrectly Specified Models”</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01799.x</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Rejoinder to “A Note on Using Regression Models to Analyze Randomized Trials: Asymptotically Valid Hypothesis Tests Despite Incorrectly Specified Models”</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Michael Rosenblum, Mark J. van der Laan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-09-28T11:22:20.997738-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/j.1541-0420.2012.01799.x</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/j.1541-0420.2012.01799.x</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fj.1541-0420.2012.01799.x</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Reader Reaction</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">290</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">290</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[]]></content:encoded><description/></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12028" xmlns="http://purl.org/rss/1.0/"><title>Statistics of Medical Imaging by LEI, T.</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12028</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Statistics of Medical Imaging by LEI, T.</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Hongtu Zhu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-05T12:32:32.64833-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12028</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12028</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12028</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Book Review</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">291</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">292</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<div class="section" id="biom12002-sec-0001" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><div class="para"><p>EDITOR: GUILHERME J. M. ROSA</p></div><div class="para"><p><b>Statistics of Medical Imaging</b></p></div><div class="para"><p>(T. Lei)</p></div><div class="para"><p><em>Hongtu Zhu</em></p></div><div class="para"><p><b>Bayesian Smoothing and Regression for Longitudinal, Spatial and Event History Data</b></p></div><div class="para"><p>(L. Fahrmeir and T. Kneib)</p></div><div class="para"><p><em>Renato Assunção</em></p></div><div class="para"><p><b>Targeted Learning</b></p></div><div class="para"><p>(M. van der Laan and S. Rose)</p></div><div class="para"><p><em>Andrea Rotnitzky</em></p></div></div>
]]></content:encoded><description>

EDITOR: GUILHERME J. M. ROSA
Statistics of Medical Imaging
(T. Lei)
Hongtu Zhu
Bayesian Smoothing and Regression for Longitudinal, Spatial and Event History Data
(L. Fahrmeir and T. Kneib)
Renato Assunção
Targeted Learning
(M. van der Laan and S. Rose)
Andrea Rotnitzky

</description></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12029" xmlns="http://purl.org/rss/1.0/"><title>Bayesian Smoothing and Regression for Longitudinal, Spatial and Event History Data by FAHRMEIR, L. and KNEIB, T.</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12029</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian Smoothing and Regression for Longitudinal, Spatial and Event History Data by FAHRMEIR, L. and KNEIB, T.</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Renato Assunção</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-05T12:32:32.64833-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12029</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12029</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12029</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Book Review</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">292</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">292</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[]]></content:encoded><description/></item><item rdf:about="http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12030" xmlns="http://purl.org/rss/1.0/"><title>Targeted Learning by VAN DER LAAN, M. and ROSE, S.</title><link>http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12030</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Targeted Learning by VAN DER LAAN, M. and ROSE, S.</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Andrea Rotnitzky</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2013-04-05T12:32:32.64833-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1111/biom.12030</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1111/biom.12030</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://onlinelibrary.wiley.com/resolve/doi?DOI=10.1111%2Fbiom.12030</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Book Review</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">293</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">293</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[]]></content:encoded><description/></item></rdf:RDF>