<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet href="http://onlinelibrarystatic.wiley.com/xslt/wol-journal-rss.xsl"
            type="text/xsl"?><rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"><channel rdf:about="http://onlinelibrary.wiley.com/rss/journal/10.1002/(ISSN)1097-0258" xmlns="http://purl.org/rss/1.0/"><title>Statistics in Medicine</title><description> Wiley Online Library : Statistics in Medicine</description><link>http://dx.doi.org/10.1002%2F%28ISSN%291097-0258</link><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc</dc:publisher><dc:language xmlns:dc="http://purl.org/dc/elements/1.1/">en</dc:language><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/">© John Wiley &amp; Sons, Ltd.</dc:rights><prism:issn xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">0277-6715</prism:issn><prism:eIssn xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">1097-0258</prism:eIssn><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><prism:coverDisplayDate xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">15 March 2012</prism:coverDisplayDate><prism:volume xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">31</prism:volume><prism:number xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">6</prism:number><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">501</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">600</prism:endingPage><image rdf:resource="http://onlinelibrary.wiley.com/store/10.1002/sim.v31.6/asset/cover.gif?v=1&amp;s=1e845a692be4ec152c3c0cc2495d821434960687"/><items><rdf:Seq><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4509"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4479"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.5309"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4476"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4492"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4455"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4477"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4478"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4474"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4464"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4439"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4465"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4457"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4463"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4462"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4409"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4461"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4443"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4440"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4447"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4416"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4437"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4417"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4435"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4419"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4418"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4343"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4359"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4385"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4387"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4404"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4357"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4389"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4371"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4370"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4391"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4354"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4386"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4390"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4335"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4384"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4367"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4369"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4345"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4363"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4356"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4304"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4275"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4242"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4146"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4168"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4003"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4034"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.3980"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4432"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4425"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4423"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4420"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4450"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4438"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4456"/><rdf:li rdf:resource="http://dx.doi.org/10.1002%2Fsim.4436"/></rdf:Seq></items></channel><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4509" xmlns="http://purl.org/rss/1.0/"><title>Classification accuracy and cut point selection</title><link>http://dx.doi.org/10.1002%2Fsim.4509</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Classification accuracy and cut point selection</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xinhua Liu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T09:26:00.55831-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4509</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4509</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4509</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In biomedical research and practice, quantitative tests or biomarkers are often used for diagnostic or screening purposes, with a cut point established on the quantitative measurement to aid binary classification. This paper introduces an alternative to the traditional methods based on the Youden index and the closest-to-(0, 1) criterion for threshold selection. A concordance probability evaluating the classification accuracy of a dichotomized measure is defined as an objective function of the possible cut point. A nonparametric approach is used to search for the optimal cut point maximizing the objective function. The procedure is shown to perform well in a simulation study. Using data from a real-world study of arsenic-induced skin lesions, we apply the method to a measure of blood arsenic levels, selecting a cut point to be used as a warning threshold. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In biomedical research and practice, quantitative tests or biomarkers are often used for diagnostic or screening purposes, with a cut point established on the quantitative measurement to aid binary classification. This paper introduces an alternative to the traditional methods based on the Youden index and the closest-to-(0, 1) criterion for threshold selection. A concordance probability evaluating the classification accuracy of a dichotomized measure is defined as an objective function of the possible cut point. A nonparametric approach is used to search for the optimal cut point maximizing the objective function. The procedure is shown to perform well in a simulation study. Using data from a real-world study of arsenic-induced skin lesions, we apply the method to a measure of blood arsenic levels, selecting a cut point to be used as a warning threshold. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4479" xmlns="http://purl.org/rss/1.0/"><title>General joint frailty model for recurrent event data with a dependent terminal event: Application to follicular lymphoma data</title><link>http://dx.doi.org/10.1002%2Fsim.4479</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">General joint frailty model for recurrent event data with a dependent terminal event: Application to follicular lymphoma data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yassin Mazroui</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Simone Mathoulin-Pelissier</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Pierre Soubeyran</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Virginie Rondeau</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T08:34:26.666682-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4479</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4479</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4479</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Many biomedical studies focus on delaying disease relapses and on prolonging survival. Usual methods only consider one event, often the first recurrence or death. However, ignoring the other recurrences may lead to biased results. The whole history of the disease should be considered for each patient. In addition, some diseases involve recurrences that can increase the risk of death. In this case, the death time may be dependent on the recurrent event history. We propose a joint frailty model to analyze recurrences and death simultaneously. Two gamma-distributed frailties take into account both the inter-recurrences dependence and the dependence between the recurrences and the survival times. We estimate separate parameters for disease recurrent event times and survival times in the joint frailty model to distinguish treatment effects and prognostic factors on these two types of events. We show how maximum penalized likelihood estimation can be applied to semiparametric estimation of the continuous hazard functions in the proposed joint frailty model with right censoring. We also propose parametrical approach. We evaluate the model by simulation studies and illustrate through a study of patients with follicular lymphoma. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Many biomedical studies focus on delaying disease relapses and on prolonging survival. Usual methods only consider one event, often the first recurrence or death. However, ignoring the other recurrences may lead to biased results. The whole history of the disease should be considered for each patient. In addition, some diseases involve recurrences that can increase the risk of death. In this case, the death time may be dependent on the recurrent event history. We propose a joint frailty model to analyze recurrences and death simultaneously. Two gamma-distributed frailties take into account both the inter-recurrences dependence and the dependence between the recurrences and the survival times. We estimate separate parameters for disease recurrent event times and survival times in the joint frailty model to distinguish treatment effects and prognostic factors on these two types of events. We show how maximum penalized likelihood estimation can be applied to semiparametric estimation of the continuous hazard functions in the proposed joint frailty model with right censoring. We also propose parametrical approach. We evaluate the model by simulation studies and illustrate through a study of patients with follicular lymphoma. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.5309" xmlns="http://purl.org/rss/1.0/"><title>A nonparametric test for equality of survival medians</title><link>http://dx.doi.org/10.1002%2Fsim.5309</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A nonparametric test for equality of survival medians</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Mohammad H. Rahbar</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhongxue Chen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sangchoon Jeon</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Joseph C. Gardiner</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jing Ning</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:52:36.600178-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.5309</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.5309</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.5309</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>In clinical trials, researchers often encounter testing for equality of survival medians across study arms based on censored data. Even though Brookmeyer and Crowley introduced a method for comparing medians of several survival distributions, still some researchers misuse procedures that are designed for testing the homogeneity of survival curves. These procedures include the log-rank, Wilcoxon, and Cox models. This practice leads to inflation of the probability of a type I error, particularly when the underlying assumptions of these procedures are not met. We propose a new nonparametric method for testing the equality of several survival medians based on the Kaplan–Meier estimation from randomly right-censored data. We derive asymptotic properties of this test statistic. Through simulations, we compute and compare the empirical probabilities of type I errors and the power of this new procedure with those of the Brookmeyer–Crowley, log-rank, and Wilcoxon methods.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>Our simulation results indicate that the performance of these test procedures depends on the level of censoring and appropriateness of the underlying assumptions. When the objective is to test homogeneity of survival medians rather than survival curves and the assumptions of these tests are not met, some of these procedures severely inflate the probability of a type I error. In these situations, our test statistic provides an alternative to the Brookmeyer–Crowley test. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In clinical trials, researchers often encounter testing for equality of survival medians across study arms based on censored data. Even though Brookmeyer and Crowley introduced a method for comparing medians of several survival distributions, still some researchers misuse procedures that are designed for testing the homogeneity of survival curves. These procedures include the log-rank, Wilcoxon, and Cox models. This practice leads to inflation of the probability of a type I error, particularly when the underlying assumptions of these procedures are not met. We propose a new nonparametric method for testing the equality of several survival medians based on the Kaplan–Meier estimation from randomly right-censored data. We derive asymptotic properties of this test statistic. Through simulations, we compute and compare the empirical probabilities of type I errors and the power of this new procedure with those of the Brookmeyer–Crowley, log-rank, and Wilcoxon methods.Our simulation results indicate that the performance of these test procedures depends on the level of censoring and appropriateness of the underlying assumptions. When the objective is to test homogeneity of survival medians rather than survival curves and the assumptions of these tests are not met, some of these procedures severely inflate the probability of a type I error. In these situations, our test statistic provides an alternative to the Brookmeyer–Crowley test. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4476" xmlns="http://purl.org/rss/1.0/"><title>Predictive power to assist phase 3 go/no go decision based on phase 2 data on a different endpoint</title><link>http://dx.doi.org/10.1002%2Fsim.4476</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Predictive power to assist phase 3 go/no go decision based on phase 2 data on a different endpoint</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Shengyan Hong</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Li Shi</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:52:24.435486-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4476</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4476</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4476</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>One of the most critical decision points during drug development is to make a phase 3 go/no go decision after a phase 2 proof of concept trial is conducted. It is particularly challenging in oncology drug development where oftentimes the primary endpoint for phase 3 trial is overall survival (OS), but the phase 2 proof of concept trial is powered only for an early endpoint, typically progression-free survival (PFS), whose relationship to OS is often unclear. We propose the use of predictive power to assist the phase 3 go/no go decision by evaluating the strength of actual observed phase 2 efficacy effects in terms of how likely it will predict the chance of OS success in the subsequent phase 3 trial. The formula is provided for calculation of predictive power based on either observed PFS effect only, or observed OS effect only, or both. An example is provided to compare these three predictive powers, which shows that when there is little prior information about PFS and OS, the predictability based on the observed phase 2 PFS effect is low and not sensitive to the size of the trial and extent of the observed PFS effect, and it also has limited added value to the predictability based on the observed phase 2 OS effect. Therefore, one should be cautious of inherently high risk of making a phase 3 go/no go decision based on phase 2 PFS outcome alone and should take the phase 2 OS data into consideration whenever possible. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>One of the most critical decision points during drug development is to make a phase 3 go/no go decision after a phase 2 proof of concept trial is conducted. It is particularly challenging in oncology drug development where oftentimes the primary endpoint for phase 3 trial is overall survival (OS), but the phase 2 proof of concept trial is powered only for an early endpoint, typically progression-free survival (PFS), whose relationship to OS is often unclear. We propose the use of predictive power to assist the phase 3 go/no go decision by evaluating the strength of actual observed phase 2 efficacy effects in terms of how likely it will predict the chance of OS success in the subsequent phase 3 trial. The formula is provided for calculation of predictive power based on either observed PFS effect only, or observed OS effect only, or both. An example is provided to compare these three predictive powers, which shows that when there is little prior information about PFS and OS, the predictability based on the observed phase 2 PFS effect is low and not sensitive to the size of the trial and extent of the observed PFS effect, and it also has limited added value to the predictability based on the observed phase 2 OS effect. Therefore, one should be cautious of inherently high risk of making a phase 3 go/no go decision based on phase 2 PFS outcome alone and should take the phase 2 OS data into consideration whenever possible. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4492" xmlns="http://purl.org/rss/1.0/"><title>Identifying representative trees from ensembles</title><link>http://dx.doi.org/10.1002%2Fsim.4492</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Identifying representative trees from ensembles</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Mousumi Banerjee</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ying Ding</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Anne-Michelle Noone</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:50:36.582458-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4492</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4492</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4492</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Tree-based methods have become popular for analyzing complex data structures where the primary goal is risk stratification of patients. Ensemble techniques improve the accuracy in prediction and address the instability in a single tree by growing an ensemble of trees and aggregating. However, in the process, individual trees get lost. In this paper, we propose a methodology for identifying the most representative trees in an ensemble on the basis of several tree distance metrics. Although our focus is on binary outcomes, the methods are applicable to censored data as well. For any two trees, the distance metrics are chosen to (1) measure similarity of the covariates used to split the trees; (2) reflect similar clustering of patients in the terminal nodes of the trees; and (3) measure similarity in predictions from the two trees. Whereas the latter focuses on prediction, the first two metrics focus on the architectural similarity between two trees. The most representative trees in the ensemble are chosen on the basis of the average distance between a tree and all other trees in the ensemble. Out-of-bag estimate of error rate is obtained using neighborhoods of representative trees. Simulations and data examples show gains in predictive accuracy when averaging over such neighborhoods. We illustrate our methods using a dataset of kidney cancer treatment receipt (binary outcome) and a second dataset of breast cancer survival (censored outcome). Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Tree-based methods have become popular for analyzing complex data structures where the primary goal is risk stratification of patients. Ensemble techniques improve the accuracy in prediction and address the instability in a single tree by growing an ensemble of trees and aggregating. However, in the process, individual trees get lost. In this paper, we propose a methodology for identifying the most representative trees in an ensemble on the basis of several tree distance metrics. Although our focus is on binary outcomes, the methods are applicable to censored data as well. For any two trees, the distance metrics are chosen to (1) measure similarity of the covariates used to split the trees; (2) reflect similar clustering of patients in the terminal nodes of the trees; and (3) measure similarity in predictions from the two trees. Whereas the latter focuses on prediction, the first two metrics focus on the architectural similarity between two trees. The most representative trees in the ensemble are chosen on the basis of the average distance between a tree and all other trees in the ensemble. Out-of-bag estimate of error rate is obtained using neighborhoods of representative trees. Simulations and data examples show gains in predictive accuracy when averaging over such neighborhoods. We illustrate our methods using a dataset of kidney cancer treatment receipt (binary outcome) and a second dataset of breast cancer survival (censored outcome). Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4455" xmlns="http://purl.org/rss/1.0/"><title>Multilevel latent variable models for global health-related quality of life assessment</title><link>http://dx.doi.org/10.1002%2Fsim.4455</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Multilevel latent variable models for global health-related quality of life assessment</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Annette Kifley</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Gillian Z. Heller</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ken J. Beath</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">David Bulger</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jun Ma</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Val Gebski</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:46:13.200302-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4455</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4455</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4455</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Quality of life (QOL) assessment is a key component of many clinical studies and frequently requires the use of single global summary measures that capture the overall balance of findings from a potentially wide-ranging assessment of QOL issues. We propose and evaluate an irregular multilevel latent variable model suitable for use as a global summary tool for health-related QOL assessments. The proposed model is a multiple indicator and multiple cause style of model with a two-level latent variable structure. We approach the modeling from a general multilevel modeling perspective, using a combination of random and nonrandom cluster types to accommodate the mixture of issues commonly evaluated in health-related QOL assessments—overall perceptions of QOL and health, along with specific psychological, physical, social, and functional issues. Using clinical trial data, we evaluate the merits and application of this approach in detail, both for mean global QOL and for change from baseline. We show that the proposed model generally performs well in comparing global patterns of treatment effect and provides more precise and reliable estimates than several common alternatives such as selecting from or averaging observed global item measures. A variety of computational methods could be used for estimation. We derived a closed-form expression for the marginal likelihood that can be used to obtain maximum likelihood parameter estimates when normality assumptions are reasonable. Our approach is useful for QOL evaluations aimed at pharmacoeconomic or individual clinical decision making and in obtaining summary QOL measures for use in quality-adjusted survival analyses. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Quality of life (QOL) assessment is a key component of many clinical studies and frequently requires the use of single global summary measures that capture the overall balance of findings from a potentially wide-ranging assessment of QOL issues. We propose and evaluate an irregular multilevel latent variable model suitable for use as a global summary tool for health-related QOL assessments. The proposed model is a multiple indicator and multiple cause style of model with a two-level latent variable structure. We approach the modeling from a general multilevel modeling perspective, using a combination of random and nonrandom cluster types to accommodate the mixture of issues commonly evaluated in health-related QOL assessments—overall perceptions of QOL and health, along with specific psychological, physical, social, and functional issues. Using clinical trial data, we evaluate the merits and application of this approach in detail, both for mean global QOL and for change from baseline. We show that the proposed model generally performs well in comparing global patterns of treatment effect and provides more precise and reliable estimates than several common alternatives such as selecting from or averaging observed global item measures. A variety of computational methods could be used for estimation. We derived a closed-form expression for the marginal likelihood that can be used to obtain maximum likelihood parameter estimates when normality assumptions are reasonable. Our approach is useful for QOL evaluations aimed at pharmacoeconomic or individual clinical decision making and in obtaining summary QOL measures for use in quality-adjusted survival analyses. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4477" xmlns="http://purl.org/rss/1.0/"><title>A pathway analysis method for genome-wide association studies</title><link>http://dx.doi.org/10.1002%2Fsim.4477</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A pathway analysis method for genome-wide association studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Babak Shahbaba</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Catherine M. Shachaf</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhaoxia Yu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:39:18.232792-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4477</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4477</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4477</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>For genome-wide association studies, we propose a new method for identifying significant biological pathways. In this approach, we aggregate data across single-nucleotide polymorphisms to obtain summary measures at the gene level. We then use a hierarchical Bayesian model, which takes the gene-level summary measures as data, in order to evaluate the relevance of each pathway to an outcome of interest (e.g., disease status). Although shifting the focus of analysis from individual genes to pathways has proven to improve the statistical power and provide more robust results, such methods tend to eliminate a large number of genes whose pathways are unknown. For these genes, we propose to use a Bayesian multinomial logit model to predict the associated pathways by using the genes with known pathways as the training data. Our hierarchical Bayesian model takes the uncertainty regarding the pathway predictions into account while assessing the significance of pathways. We apply our method to two independent studies on type 2 diabetes and show that the overlap between the results from the two studies is statistically significant. We also evaluate our approach on the basis of simulated data. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>For genome-wide association studies, we propose a new method for identifying significant biological pathways. In this approach, we aggregate data across single-nucleotide polymorphisms to obtain summary measures at the gene level. We then use a hierarchical Bayesian model, which takes the gene-level summary measures as data, in order to evaluate the relevance of each pathway to an outcome of interest (e.g., disease status). Although shifting the focus of analysis from individual genes to pathways has proven to improve the statistical power and provide more robust results, such methods tend to eliminate a large number of genes whose pathways are unknown. For these genes, we propose to use a Bayesian multinomial logit model to predict the associated pathways by using the genes with known pathways as the training data. Our hierarchical Bayesian model takes the uncertainty regarding the pathway predictions into account while assessing the significance of pathways. We apply our method to two independent studies on type 2 diabetes and show that the overlap between the results from the two studies is statistically significant. We also evaluate our approach on the basis of simulated data. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4478" xmlns="http://purl.org/rss/1.0/"><title>A mixed non-homogeneous hidden Markov model for categorical data, with application to alcohol consumption</title><link>http://dx.doi.org/10.1002%2Fsim.4478</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A mixed non-homogeneous hidden Markov model for categorical data, with application to alcohol consumption</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Antonello Maruotti</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Roberto Rocci</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:29:14.859715-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4478</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4478</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4478</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Hidden Markov models (HMMs) are frequently used to analyse longitudinal data, where the same set of subjects is repeatedly observed over time. In this context, several sources of heterogeneity may arise at individual and/or time level, which affect the hidden process, that is, the transition probabilities between the hidden states. In this paper, we propose the use of a finite mixture of non-homogeneous HMMs (NH-HMMs) to face the heterogeneity problem. The non-homogeneity of the model allows us to take into account observed sources of heterogeneity by means of a proper set of covariates, time and/or individual dependent, explaining the variations in the transition probabilities. Moreover, we handle the unobserved sources of heterogeneity at the individual level, due to, for example, omitted covariates, by introducing a random term with a discrete distribution. The resulting model is a finite mixture of NH-HMM that can be used to classify individuals according to their dynamic behaviour or to estimate a mixed NH-HMM without any assumption regarding the distribution of the random term following the non-parametric maximum likelihood approach. We test the effectiveness of the proposal through a simulation study and an application to real data on alcohol abuse. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Hidden Markov models (HMMs) are frequently used to analyse longitudinal data, where the same set of subjects is repeatedly observed over time. In this context, several sources of heterogeneity may arise at individual and/or time level, which affect the hidden process, that is, the transition probabilities between the hidden states. In this paper, we propose the use of a finite mixture of non-homogeneous HMMs (NH-HMMs) to face the heterogeneity problem. The non-homogeneity of the model allows us to take into account observed sources of heterogeneity by means of a proper set of covariates, time and/or individual dependent, explaining the variations in the transition probabilities. Moreover, we handle the unobserved sources of heterogeneity at the individual level, due to, for example, omitted covariates, by introducing a random term with a discrete distribution. The resulting model is a finite mixture of NH-HMM that can be used to classify individuals according to their dynamic behaviour or to estimate a mixed NH-HMM without any assumption regarding the distribution of the random term following the non-parametric maximum likelihood approach. We test the effectiveness of the proposal through a simulation study and an application to real data on alcohol abuse. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4474" xmlns="http://purl.org/rss/1.0/"><title>On the covariance of two correlated log-odds ratios</title><link>http://dx.doi.org/10.1002%2Fsim.4474</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">On the covariance of two correlated log-odds ratios</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Pantelis G. Bagos</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-02-03T03:29:06.872449-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4474</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4474</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4474</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In many applications two correlated estimates of an effect size need to be considered simultaneously to be combined or compared. Apparently, there is a need for calculating their covariance, which however requires access to the individual data that may not be available to a researcher performing the analysis. We present a simple and efficient method for calculating the covariance of two correlated log-odds ratios. The method is very simple, is based on the well-known large sample approximations, can be applied using only data that are available in the published reports and more importantly, is very general, because it is shown to encompass several previously derived estimates (multiple outcomes, multiple treatments, dose–response models, mutually exclusive outcomes, genetic association studies) as special cases. By encompassing the previous approaches in a unified framework, the method allows easily deriving estimates for the covariance concerning problems that were not easy to be obtained otherwise. We show that the method can be used to derive the covariance of log-odds ratios from matched and unmatched case-control studies that use the same cases, a situation that has been addressed in the past only using individual data. Future applications of the method are discussed. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In many applications two correlated estimates of an effect size need to be considered simultaneously to be combined or compared. Apparently, there is a need for calculating their covariance, which however requires access to the individual data that may not be available to a researcher performing the analysis. We present a simple and efficient method for calculating the covariance of two correlated log-odds ratios. The method is very simple, is based on the well-known large sample approximations, can be applied using only data that are available in the published reports and more importantly, is very general, because it is shown to encompass several previously derived estimates (multiple outcomes, multiple treatments, dose–response models, mutually exclusive outcomes, genetic association studies) as special cases. By encompassing the previous approaches in a unified framework, the method allows easily deriving estimates for the covariance concerning problems that were not easy to be obtained otherwise. We show that the method can be used to derive the covariance of log-odds ratios from matched and unmatched case-control studies that use the same cases, a situation that has been addressed in the past only using individual data. Future applications of the method are discussed. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4464" xmlns="http://purl.org/rss/1.0/"><title>Estimating net survival: the importance of allowing for informative censoring</title><link>http://dx.doi.org/10.1002%2Fsim.4464</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating net survival: the importance of allowing for informative censoring</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Coraline Danieli</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Laurent Remontet</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Nadine Bossard</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Laurent Roche</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Aurélien Belot</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-26T06:53:09.44934-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4464</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4464</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4464</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Net survival, the one that would be observed if cancer were the only cause of death, is the most appropriate indicator to compare cancer mortality between areas or countries. Several parametric and non-parametric methods have been developed to estimate net survival, particularly when the cause of death is unknown. These methods are based either on the relative survival ratio or on the additive excess hazard model, the latter using the general population mortality hazard to estimate the excess mortality hazard (the hazard related to net survival). The present work used simulations to compare estimator abilities to estimate net survival in different settings such as the presence/absence of an age effect on the excess mortality hazard or on the potential time of follow-up, knowing that this covariate has an effect on the general population mortality hazard too. It showed that when age affected the excess mortality hazard, most estimators, including specific survival, were biased. Only two estimators were appropriate to estimate net survival. The first is based on a multivariable excess hazard model that includes age as covariate. The second is non-parametric and is based on the inverse probability weighting. These estimators take differently into account the informative censoring induced by the expected mortality process. The former offers great flexibility whereas the latter requires neither the assumption of a specific distribution nor a model-building strategy. Because of its simplicity and availability in commonly used software, the nonparametric estimator should be considered by cancer registries for population-based studies. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Net survival, the one that would be observed if cancer were the only cause of death, is the most appropriate indicator to compare cancer mortality between areas or countries. Several parametric and non-parametric methods have been developed to estimate net survival, particularly when the cause of death is unknown. These methods are based either on the relative survival ratio or on the additive excess hazard model, the latter using the general population mortality hazard to estimate the excess mortality hazard (the hazard related to net survival). The present work used simulations to compare estimator abilities to estimate net survival in different settings such as the presence/absence of an age effect on the excess mortality hazard or on the potential time of follow-up, knowing that this covariate has an effect on the general population mortality hazard too. It showed that when age affected the excess mortality hazard, most estimators, including specific survival, were biased. Only two estimators were appropriate to estimate net survival. The first is based on a multivariable excess hazard model that includes age as covariate. The second is non-parametric and is based on the inverse probability weighting. These estimators take differently into account the informative censoring induced by the expected mortality process. The former offers great flexibility whereas the latter requires neither the assumption of a specific distribution nor a model-building strategy. Because of its simplicity and availability in commonly used software, the nonparametric estimator should be considered by cancer registries for population-based studies. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4439" xmlns="http://purl.org/rss/1.0/"><title>Hierarchical Bayesian formulations for selecting variables in regression models</title><link>http://dx.doi.org/10.1002%2Fsim.4439</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Hierarchical Bayesian formulations for selecting variables in regression models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Veronika Rockova</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Emmanuel Lesaffre</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jolanda Luime</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Bob Löwenberg</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-25T02:14:08.11583-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4439</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4439</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4439</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The objective of finding a parsimonious representation of the observed data by a statistical model that is also capable of accurate prediction is commonplace in all domains of statistical applications. The parsimony of the solutions obtained by variable selection is usually counterbalanced by a limited prediction capacity. On the other hand, methodologies that assure high prediction accuracy usually lead to models that are neither simple nor easily interpretable. Regularization methodologies have proven to be useful in addressing both prediction and variable selection problems. The Bayesian approach to regularization constitutes a particularly attractive alternative as it is suitable for high-dimensional modeling, offers valid standard errors, and enables simultaneous estimation of regression coefficients and complexity parameters via computationally efficient MCMC techniques. Bayesian regularization falls within the versatile framework of Bayesian hierarchical models, which encompasses a variety of other approaches suited for variable selection such as spike and slab models and the <em>MC</em><sup>3</sup> approach. In this article, we review these Bayesian developments and evaluate their variable selection performance in a simulation study for the classical small <em>p</em> large <em>n</em> setting. The majority of the existing Bayesian methodology for variable selection deals only with classical linear regression. Here, we present two applications in the contexts of binary and survival regression, where the Bayesian approach was applied to select markers prognostically relevant for the development of rheumatoid arthritis and for overall survival in acute myeloid leukemia patients. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The objective of finding a parsimonious representation of the observed data by a statistical model that is also capable of accurate prediction is commonplace in all domains of statistical applications. The parsimony of the solutions obtained by variable selection is usually counterbalanced by a limited prediction capacity. On the other hand, methodologies that assure high prediction accuracy usually lead to models that are neither simple nor easily interpretable. Regularization methodologies have proven to be useful in addressing both prediction and variable selection problems. The Bayesian approach to regularization constitutes a particularly attractive alternative as it is suitable for high-dimensional modeling, offers valid standard errors, and enables simultaneous estimation of regression coefficients and complexity parameters via computationally efficient MCMC techniques. Bayesian regularization falls within the versatile framework of Bayesian hierarchical models, which encompasses a variety of other approaches suited for variable selection such as spike and slab models and the MC3 approach. In this article, we review these Bayesian developments and evaluate their variable selection performance in a simulation study for the classical small p large n setting. The majority of the existing Bayesian methodology for variable selection deals only with classical linear regression. Here, we present two applications in the contexts of binary and survival regression, where the Bayesian approach was applied to select markers prognostically relevant for the development of rheumatoid arthritis and for overall survival in acute myeloid leukemia patients. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4465" xmlns="http://purl.org/rss/1.0/"><title>The analysis of binary longitudinal data with time-dependent covariates</title><link>http://dx.doi.org/10.1002%2Fsim.4465</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">The analysis of binary longitudinal data with time-dependent covariates</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Matthew W. Guerra</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Justine Shults</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jay Amsterdam</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Thomas Ten-Have</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-13T06:40:55.339018-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4465</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4465</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4465</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>We consider longitudinal studies with binary outcomes that are measured repeatedly on subjects over time. The goal of our analysis was to fit a logistic model that relates the expected value of the outcomes with explanatory variables that are measured on each subject. However, additional care must be taken to adjust for the association between the repeated measurements on each subject. We propose a new maximum likelihood method for covariates that may be fixed or time varying. We also implement and make comparisons with two other approaches: generalized estimating equations, which may be more robust to misspecification of the true correlation structure, and alternating logistic regression, which models association via odds ratios that are subject to less restrictive constraints than are correlations. The proposed estimation procedure will yield consistent and asymptotically normal estimates of the regression and correlation parameters if the correlation on consecutive measurements on a subject is correctly specified. Simulations demonstrate that our approach can yield improved efficiency in estimation of the regression parameter; for equally spaced and complete data, the gains in efficiency were greatest for the parameter associated with a time-by-group interaction term and for stronger values of the correlation. For unequally spaced data and with dropout according to a missing-at-random mechanism, MARK1ML with correctly specified consecutive correlations yielded substantial improvements in terms of both bias and efficiency. We present an analysis to demonstrate application of the methods we consider. We also offer an R function for easy implementation of our approach. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>We consider longitudinal studies with binary outcomes that are measured repeatedly on subjects over time. The goal of our analysis was to fit a logistic model that relates the expected value of the outcomes with explanatory variables that are measured on each subject. However, additional care must be taken to adjust for the association between the repeated measurements on each subject. We propose a new maximum likelihood method for covariates that may be fixed or time varying. We also implement and make comparisons with two other approaches: generalized estimating equations, which may be more robust to misspecification of the true correlation structure, and alternating logistic regression, which models association via odds ratios that are subject to less restrictive constraints than are correlations. The proposed estimation procedure will yield consistent and asymptotically normal estimates of the regression and correlation parameters if the correlation on consecutive measurements on a subject is correctly specified. Simulations demonstrate that our approach can yield improved efficiency in estimation of the regression parameter; for equally spaced and complete data, the gains in efficiency were greatest for the parameter associated with a time-by-group interaction term and for stronger values of the correlation. For unequally spaced data and with dropout according to a missing-at-random mechanism, MARK1ML with correctly specified consecutive correlations yielded substantial improvements in terms of both bias and efficiency. We present an analysis to demonstrate application of the methods we consider. We also offer an R function for easy implementation of our approach. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4457" xmlns="http://purl.org/rss/1.0/"><title>Mixed effect Poisson log-linear models for clinical and epidemiological sleep hypnogram data</title><link>http://dx.doi.org/10.1002%2Fsim.4457</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Mixed effect Poisson log-linear models for clinical and epidemiological sleep hypnogram data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Bruce J. Swihart</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Brian S. Caffo</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ciprian M. Crainiceanu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Naresh M. Punjabi</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-13T01:37:08.983614-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4457</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4457</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4457</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Bayesian Poisson log-linear multilevel models scalable to epidemiological studies are proposed to investigate population variability in sleep state transition rates. Hierarchical random effects are used to account for pairings of subjects and repeated measures within those subjects, as comparing diseased with non-diseased subjects while minimizing bias is of importance. Essentially, non-parametric piecewise constant hazards are estimated and smoothed, allowing for time-varying covariates and segment of the night comparisons. The Bayesian Poisson regression is justified through a re-derivation of a classical algebraic likelihood equivalence of Poisson regression with a log(time) offset and survival regression assuming exponentially distributed survival times. Such re-derivation allows synthesis of two methods currently used to analyze sleep transition phenomena: stratified multi-state proportional hazards models and log-linear generalized estimating equations (GEE) models for transition counts. An example data set from the Sleep Heart Health Study is analyzed. Supplementary material includes the analyzed data set as well as the code for a reproducible analysis. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Bayesian Poisson log-linear multilevel models scalable to epidemiological studies are proposed to investigate population variability in sleep state transition rates. Hierarchical random effects are used to account for pairings of subjects and repeated measures within those subjects, as comparing diseased with non-diseased subjects while minimizing bias is of importance. Essentially, non-parametric piecewise constant hazards are estimated and smoothed, allowing for time-varying covariates and segment of the night comparisons. The Bayesian Poisson regression is justified through a re-derivation of a classical algebraic likelihood equivalence of Poisson regression with a log(time) offset and survival regression assuming exponentially distributed survival times. Such re-derivation allows synthesis of two methods currently used to analyze sleep transition phenomena: stratified multi-state proportional hazards models and log-linear generalized estimating equations (GEE) models for transition counts. An example data set from the Sleep Heart Health Study is analyzed. Supplementary material includes the analyzed data set as well as the code for a reproducible analysis. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4463" xmlns="http://purl.org/rss/1.0/"><title>Bayesian approach to predicting cancer incidence for an area without cancer registration by using cancer incidence data from nearby areas</title><link>http://dx.doi.org/10.1002%2Fsim.4463</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian approach to predicting cancer incidence for an area without cancer registration by using cancer incidence data from nearby areas</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ramon Clèries</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Josepa Ribes</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Maria Buxo</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Alberto Ameijide</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Rafael Marcos-Gragera</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jaume Galceran</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">José Miguel Martínez</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yutaka Yasui</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-11T10:15:14.057092-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4463</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4463</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4463</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>This paper compares three different methods for performing cancer incidence prediction in an area without a cancer registry under a Bayesian framework, using linear and log-linear age-period models with either age-specific slopes or a common slope across age groups. The three methods assume that a nearby area with a cancer registration has similar incidence and mortality patterns as the area of interest without a cancer registry where the cancer incidence prediction is carried out. The three methods differ in modeling strategies: (i) modeling the incidence rate directly; (ii) modeling the ratio of the number of incident cases to that of mortality cases; and (iii) modeling the difference between the incidence rate and the mortality rate. Strategy (iii) is a new approach in this type of projection. Empirical assessment is made using real data from the cancer registry of Tarragona, Spain, to predict cancer incidence in Girona, Spain, and vice versa. Predictions of short-term (3–4 years) incidence were made for 2001 in Tarragona using observed cancer incidence and mortality data for 1994–1998 from Girona. Short-term predictions were made for 2002 in Girona using Tarragona's 1994–1998 data. Additionally, long-term (10 years) incidence rate predictions were made for 2002 in Girona using data from Tarragona for the period 1985–1992. Our results suggest that extrapolating time-trends of incidence rates minus mortality rates may have the best predictive performance overall. These methods of population-level disease vincidence prediction are highly relevant to health care planning and policy decisions. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>This paper compares three different methods for performing cancer incidence prediction in an area without a cancer registry under a Bayesian framework, using linear and log-linear age-period models with either age-specific slopes or a common slope across age groups. The three methods assume that a nearby area with a cancer registration has similar incidence and mortality patterns as the area of interest without a cancer registry where the cancer incidence prediction is carried out. The three methods differ in modeling strategies: (i) modeling the incidence rate directly; (ii) modeling the ratio of the number of incident cases to that of mortality cases; and (iii) modeling the difference between the incidence rate and the mortality rate. Strategy (iii) is a new approach in this type of projection. Empirical assessment is made using real data from the cancer registry of Tarragona, Spain, to predict cancer incidence in Girona, Spain, and vice versa. Predictions of short-term (3–4 years) incidence were made for 2001 in Tarragona using observed cancer incidence and mortality data for 1994–1998 from Girona. Short-term predictions were made for 2002 in Girona using Tarragona's 1994–1998 data. Additionally, long-term (10 years) incidence rate predictions were made for 2002 in Girona using data from Tarragona for the period 1985–1992. Our results suggest that extrapolating time-trends of incidence rates minus mortality rates may have the best predictive performance overall. These methods of population-level disease vincidence prediction are highly relevant to health care planning and policy decisions. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4462" xmlns="http://purl.org/rss/1.0/"><title>A two-stage Bayesian design for co-development of new drugs and companion diagnostics</title><link>http://dx.doi.org/10.1002%2Fsim.4462</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A two-stage Bayesian design for co-development of new drugs and companion diagnostics</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Stella Wanjugu Karuri</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Richard Simon</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-11T10:05:52.039845-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4462</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4462</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4462</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Most new drug development in oncology is based on targeting specific molecules. Genomic profiles and deregulated drug targets vary from patient to patient making new treatments likely to benefit only a subset of patients traditionally grouped in the same clinical trials. Predictive biomarkers are being developed to identify patients who are most likely to benefit from a particular treatment; however, their biological basis is not always conclusive. The inclusion of marker-negative patients in a trial is therefore sometimes necessary for a more informative evaluation of the therapy. In this paper, we present a two-stage Bayesian design that includes both marker-positive and marker-negative patients in a clinical trial. We formulate a family of prior distributions that represent the degree of <em>a priori</em> confidence in the predictive biomarker. To avoid exposing patients to a treatment to which they may not be expected to benefit, we perform an interim analysis that may stop accrual of marker-negative patients or accrual of all patients. We demonstrate with simulations that the design and priors used control type I errors, give adequate power, and enable the early futility analysis of test-negative patients to be based on prior specification on the strength of evidence in the biomarker. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Most new drug development in oncology is based on targeting specific molecules. Genomic profiles and deregulated drug targets vary from patient to patient making new treatments likely to benefit only a subset of patients traditionally grouped in the same clinical trials. Predictive biomarkers are being developed to identify patients who are most likely to benefit from a particular treatment; however, their biological basis is not always conclusive. The inclusion of marker-negative patients in a trial is therefore sometimes necessary for a more informative evaluation of the therapy. In this paper, we present a two-stage Bayesian design that includes both marker-positive and marker-negative patients in a clinical trial. We formulate a family of prior distributions that represent the degree of a priori confidence in the predictive biomarker. To avoid exposing patients to a treatment to which they may not be expected to benefit, we perform an interim analysis that may stop accrual of marker-negative patients or accrual of all patients. We demonstrate with simulations that the design and priors used control type I errors, give adequate power, and enable the early futility analysis of test-negative patients to be based on prior specification on the strength of evidence in the biomarker. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4409" xmlns="http://purl.org/rss/1.0/"><title>The basic theory, diagnostic, and therapeutic system of traditional Chinese medicine and the challenges they bring to statistics</title><link>http://dx.doi.org/10.1002%2Fsim.4409</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">The basic theory, diagnostic, and therapeutic system of traditional Chinese medicine and the challenges they bring to statistics</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jingqing Hu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Baoyan Liu</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-01-11T10:00:29.126154-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4409</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4409</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4409</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Traditional Chinese medicine (TCM) has an unique theory system and abundant preventative and therapeutic methods. In recent years, TCM has gradually become the hot topic of application and research around the world. This paper introduces how TCM uses the theory of yin-yang and five-phase to explain the mechanism of balancing the function of human body, the methods of diagnosing, abundant therapeutic methods and technologies, and treating principles, analyzes the features of TCM, and points out some of the problems waitiing to be solved in TCM scientific researches and statistical analysis. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Traditional Chinese medicine (TCM) has an unique theory system and abundant preventative and therapeutic methods. In recent years, TCM has gradually become the hot topic of application and research around the world. This paper introduces how TCM uses the theory of yin-yang and five-phase to explain the mechanism of balancing the function of human body, the methods of diagnosing, abundant therapeutic methods and technologies, and treating principles, analyzes the features of TCM, and points out some of the problems waitiing to be solved in TCM scientific researches and statistical analysis. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4461" xmlns="http://purl.org/rss/1.0/"><title>Detecting case–control expression quantitative trait loci using locally most powerful or maximin robust rank tests</title><link>http://dx.doi.org/10.1002%2Fsim.4461</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Detecting case–control expression quantitative trait loci using locally most powerful or maximin robust rank tests</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ao Yuan</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jinfeng Xu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Qingqi Yue</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Gang Zheng</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-15T03:00:28.43077-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4461</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4461</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4461</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In testing genome-wide gene expression quantitative trait loci, efficiency robust statistical methods and their computational convenience are most relevant. For this purpose, we propose to use a modified locally most powerful rank test for the analysis of case–control expression data. This modified rank test statistic is computationally simple, robust for non-normally distributed expression data, and asymptotically locally most powerful. It depends on the specification of a location distribution form for data but is not sensitive to misspecifications. When such a location distribution form cannot be specified, we apply Gastwirth's maximin efficiency robust rank test to gene expression data to maximize the worst Pitman asymptotic relative efficiency among a family of location distributions. We conduct simulation studies to assess their performance and use an application to real data for illustration. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In testing genome-wide gene expression quantitative trait loci, efficiency robust statistical methods and their computational convenience are most relevant. For this purpose, we propose to use a modified locally most powerful rank test for the analysis of case–control expression data. This modified rank test statistic is computationally simple, robust for non-normally distributed expression data, and asymptotically locally most powerful. It depends on the specification of a location distribution form for data but is not sensitive to misspecifications. When such a location distribution form cannot be specified, we apply Gastwirth's maximin efficiency robust rank test to gene expression data to maximize the worst Pitman asymptotic relative efficiency among a family of location distributions. We conduct simulation studies to assess their performance and use an application to real data for illustration. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4443" xmlns="http://purl.org/rss/1.0/"><title>Performance of binary markers for censored failure time outcome: nonparametric approach based on proportions</title><link>http://dx.doi.org/10.1002%2Fsim.4443</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Performance of binary markers for censored failure time outcome: nonparametric approach based on proportions</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Laura Antolini</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Maria Grazia Valsecchi</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-12T13:07:31.719609-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4443</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4443</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4443</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>This work focuses on the assessment of the discrimination ability of a binary marker to identify patients that will relapse in time. We consider the cumulative definition of sensitivity and dynamic definition of specificity at a time horizon, that is, the probability of a positive marker in the population that will relapse (<em>cases</em>) and that will not relapse (<em>controls</em>). In the presence of censoring, sensitivity and specificity cannot be estimated by proportions because it is not known whether censored subjects should be considered as cases or controls. The solutions proposed do not enable to obtain asymptotic confidence intervals. We explore the use of inverse probability of censoring weighting/imputation (borrowed from the methodology used to correct for verification bias) to adjust the classification matrix for the presence of censoring. The adjustment based on weights estimated conditional on the marker turned to be equivalent to the adjustment based on imputation. These approaches, which address for the presence of marker-dependent censoring, showed a better performance than the adjustment based on weights estimated on the entire sample, even in the case of marker-independent censoring. We derived single intervals and confidence region for sensitivity and 1-specificity using the delta method. The confidence region is particularly useful for a binary marker because the marker has some ability to discriminate among cases and controls only if the region does not intersect the first quadrant bisector. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>This work focuses on the assessment of the discrimination ability of a binary marker to identify patients that will relapse in time. We consider the cumulative definition of sensitivity and dynamic definition of specificity at a time horizon, that is, the probability of a positive marker in the population that will relapse (cases) and that will not relapse (controls). In the presence of censoring, sensitivity and specificity cannot be estimated by proportions because it is not known whether censored subjects should be considered as cases or controls. The solutions proposed do not enable to obtain asymptotic confidence intervals. We explore the use of inverse probability of censoring weighting/imputation (borrowed from the methodology used to correct for verification bias) to adjust the classification matrix for the presence of censoring. The adjustment based on weights estimated conditional on the marker turned to be equivalent to the adjustment based on imputation. These approaches, which address for the presence of marker-dependent censoring, showed a better performance than the adjustment based on weights estimated on the entire sample, even in the case of marker-independent censoring. We derived single intervals and confidence region for sensitivity and 1-specificity using the delta method. The confidence region is particularly useful for a binary marker because the marker has some ability to discriminate among cases and controls only if the region does not intersect the first quadrant bisector. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4440" xmlns="http://purl.org/rss/1.0/"><title>How to deal with double partial verification when evaluating two index tests in relation to a reference test?</title><link>http://dx.doi.org/10.1002%2Fsim.4440</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">How to deal with double partial verification when evaluating two index tests in relation to a reference test?</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Nan Geloven</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Kimiko A. Broeze</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Brent C. Opmeer</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ben Willem Mol</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Aeilko H. Zwinderman</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-12T12:32:18.97215-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4440</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4440</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4440</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Research into the diagnostic accuracy of clinical tests is often hampered by single or double partial verification mechanisms, that is, not all patients have their disease status verified by a reference test, neither do all patients receive all tests under evaluation (index tests). We show methods that reduce verification bias introduced when omitting data from partially tested patients. Adjustment techniques are well established when there are no missing index tests and when the reference test is ‘missing at random’. However, in practice, index tests tend to be omitted, and the choice of applying a reference test may depend on unobserved variables related to disease status, that is, verification may be missing not at random (MNAR). We study double partial verification in a clinical example from reproductive medicine in which we analyse the diagnostic values of the chlamydia antibody test and the hysterosalpingography in relation to a diagnostic laparoscopy. First, we plot all possible combinations of sensitivity and specificity of both index tests in two test ignorance regions. Then, we construct models in which we impose different assumptions for the verification process. We allow for missing index tests, study the influence of patient characteristics and study the accuracy estimates if an MNAR mechanism would operate. It is shown that data on tests used in the diagnostic process of the same population are preferably studied jointly and that the influence of an MNAR verification process was limited in a clinical study where more than half of the patients did not have the reference test. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Research into the diagnostic accuracy of clinical tests is often hampered by single or double partial verification mechanisms, that is, not all patients have their disease status verified by a reference test, neither do all patients receive all tests under evaluation (index tests). We show methods that reduce verification bias introduced when omitting data from partially tested patients. Adjustment techniques are well established when there are no missing index tests and when the reference test is ‘missing at random’. However, in practice, index tests tend to be omitted, and the choice of applying a reference test may depend on unobserved variables related to disease status, that is, verification may be missing not at random (MNAR). We study double partial verification in a clinical example from reproductive medicine in which we analyse the diagnostic values of the chlamydia antibody test and the hysterosalpingography in relation to a diagnostic laparoscopy. First, we plot all possible combinations of sensitivity and specificity of both index tests in two test ignorance regions. Then, we construct models in which we impose different assumptions for the verification process. We allow for missing index tests, study the influence of patient characteristics and study the accuracy estimates if an MNAR mechanism would operate. It is shown that data on tests used in the diagnostic process of the same population are preferably studied jointly and that the influence of an MNAR verification process was limited in a clinical study where more than half of the patients did not have the reference test. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4447" xmlns="http://purl.org/rss/1.0/"><title>Preserving the allocation ratio at every allocation with biased coin randomization and minimization in studies with unequal allocation</title><link>http://dx.doi.org/10.1002%2Fsim.4447</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Preserving the allocation ratio at every allocation with biased coin randomization and minimization in studies with unequal allocation</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Olga M. Kuznetsova</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yevgen Tymofyeyev</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-12T12:25:42.381239-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4447</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4447</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4447</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The demand for unequal allocation in clinical trials is growing. Most commonly, the unequal allocation is achieved through permuted block randomization. However, other allocation procedures might be required to better approximate the allocation ratio in small samples, reduce the selection bias in open-label studies, or balance on baseline covariates. When these allocation procedures are generalized to unequal allocation, special care is to be taken to preserve the allocation ratio at every allocation step. This paper offers a way to expand the biased coin randomization to unequal allocation that preserves the allocation ratio at every allocation. The suggested expansion works with biased coin randomization that balances only on treatment group totals and with covariate-adaptive procedures that use a random biased coin element at every allocation. Balancing properties of the allocation ratio preserving biased coin randomization and minimization are described through simulations. It is demonstrated that these procedures are asymptotically protected against the shift in the rerandomization distribution identified for some examples of minimization with 1:2 allocation. The asymptotic shift in the rerandomization distribution of the difference in treatment means for an arbitrary unequal allocation procedure is explicitly derived in the paper. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The demand for unequal allocation in clinical trials is growing. Most commonly, the unequal allocation is achieved through permuted block randomization. However, other allocation procedures might be required to better approximate the allocation ratio in small samples, reduce the selection bias in open-label studies, or balance on baseline covariates. When these allocation procedures are generalized to unequal allocation, special care is to be taken to preserve the allocation ratio at every allocation step. This paper offers a way to expand the biased coin randomization to unequal allocation that preserves the allocation ratio at every allocation. The suggested expansion works with biased coin randomization that balances only on treatment group totals and with covariate-adaptive procedures that use a random biased coin element at every allocation. Balancing properties of the allocation ratio preserving biased coin randomization and minimization are described through simulations. It is demonstrated that these procedures are asymptotically protected against the shift in the rerandomization distribution identified for some examples of minimization with 1:2 allocation. The asymptotic shift in the rerandomization distribution of the difference in treatment means for an arbitrary unequal allocation procedure is explicitly derived in the paper. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4416" xmlns="http://purl.org/rss/1.0/"><title>Bayesian-adjusted R2 for the meta-analytic evaluation of surrogate time-to-event endpoints in clinical trials</title><link>http://dx.doi.org/10.1002%2Fsim.4416</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian-adjusted R2 for the meta-analytic evaluation of surrogate time-to-event endpoints in clinical trials</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lindsay Anne Renfro</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Qian Shi</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Daniel J. Sargent</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Bradley P. Carlin</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-09T09:34:55.042136-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4416</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4416</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4416</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>A two-stage model for evaluating both trial-level and patient-level surrogacy of correlated time-to-event endpoints has been introduced, using patient-level data when multiple clinical trials are available. However, the associated maximum likelihood approach often suffers from numerical problems when different baseline hazards among trials and imperfect estimation of treatment effects are assumed. To address this issue, we propose performing the second-stage, trial-level evaluation of potential surrogates within a Bayesian framework, where we may naturally borrow information across trials while maintaining these realistic assumptions. Posterior distributions on surrogacy measures of interest may then be used to compare measures or make decisions regarding the candidacy of a specific endpoint. We perform a simulation study to investigate differences in estimation performance between traditional maximum likelihood and new Bayesian representations of common meta-analytic surrogacy measures, while assessing sensitivity to data characteristics such as number of trials, trial size, and amount of censoring. Furthermore, we present both frequentist and Bayesian trial-level surrogacy evaluations of time to recurrence for overall survival in two meta-analyses of adjuvant therapy trials in colon cancer. With these results, we recommend Bayesian evaluation as an attractive and numerically stable alternative in the multitrial assessment of potential surrogate endpoints. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>A two-stage model for evaluating both trial-level and patient-level surrogacy of correlated time-to-event endpoints has been introduced, using patient-level data when multiple clinical trials are available. However, the associated maximum likelihood approach often suffers from numerical problems when different baseline hazards among trials and imperfect estimation of treatment effects are assumed. To address this issue, we propose performing the second-stage, trial-level evaluation of potential surrogates within a Bayesian framework, where we may naturally borrow information across trials while maintaining these realistic assumptions. Posterior distributions on surrogacy measures of interest may then be used to compare measures or make decisions regarding the candidacy of a specific endpoint. We perform a simulation study to investigate differences in estimation performance between traditional maximum likelihood and new Bayesian representations of common meta-analytic surrogacy measures, while assessing sensitivity to data characteristics such as number of trials, trial size, and amount of censoring. Furthermore, we present both frequentist and Bayesian trial-level surrogacy evaluations of time to recurrence for overall survival in two meta-analyses of adjuvant therapy trials in colon cancer. With these results, we recommend Bayesian evaluation as an attractive and numerically stable alternative in the multitrial assessment of potential surrogate endpoints. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4437" xmlns="http://purl.org/rss/1.0/"><title>Sufficient dimension reduction for longitudinally measured predictors</title><link>http://dx.doi.org/10.1002%2Fsim.4437</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Sufficient dimension reduction for longitudinally measured predictors</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ruth M. Pfeiffer</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Liliana Forzani</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Efstathia Bura</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-09T09:29:05.352152-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4437</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4437</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4437</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>We propose a method to combine several predictors (markers) that are measured repeatedly over time into a composite marker score without assuming a model and only requiring a mild condition on the predictor distribution. Assuming that the first and second moments of the predictors can be decomposed into a time and a marker component via a Kronecker product structure that accommodates the longitudinal nature of the predictors, we develop first-moment sufficient dimension reduction techniques to replace the original markers with linear transformations that contain sufficient information for the regression of the predictors on the outcome. These linear combinations can then be combined into a score that has better predictive performance than a score built under a general model that ignores the longitudinal structure of the data. Our methods can be applied to either continuous or categorical outcome measures. In simulations, we focus on binary outcomes and show that our method outperforms existing alternatives by using the AUC, the area under the receiver–operator characteristics (ROC) curve, as a summary measure of the discriminatory ability of a single continuous diagnostic marker for binary disease outcomes. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>We propose a method to combine several predictors (markers) that are measured repeatedly over time into a composite marker score without assuming a model and only requiring a mild condition on the predictor distribution. Assuming that the first and second moments of the predictors can be decomposed into a time and a marker component via a Kronecker product structure that accommodates the longitudinal nature of the predictors, we develop first-moment sufficient dimension reduction techniques to replace the original markers with linear transformations that contain sufficient information for the regression of the predictors on the outcome. These linear combinations can then be combined into a score that has better predictive performance than a score built under a general model that ignores the longitudinal structure of the data. Our methods can be applied to either continuous or categorical outcome measures. In simulations, we focus on binary outcomes and show that our method outperforms existing alternatives by using the AUC, the area under the receiver–operator characteristics (ROC) curve, as a summary measure of the discriminatory ability of a single continuous diagnostic marker for binary disease outcomes. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4417" xmlns="http://purl.org/rss/1.0/"><title>Data processing and analysis in real-world traditional Chinese medicine clinical data: challenges and approaches</title><link>http://dx.doi.org/10.1002%2Fsim.4417</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Data processing and analysis in real-world traditional Chinese medicine clinical data: challenges and approaches</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Baoyan Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xuezhong Zhou</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yinhui Wang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jingqing Hu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Liyun He</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Runshun Zhang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Shibo Chen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yufeng Guo</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-09T09:23:21.307122-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4417</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4417</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4417</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Traditional Chinese medicine (TCM) is a clinical-based discipline in which real-world clinical practice plays a significant role for both the development of clinical therapy and theoretical research. The large-scale clinical data generated during the daily clinical operations of TCM provide a highly valuable knowledge source for clinical decision making. Secondary analysis of these data would be a vital task for TCM clinical studies before the randomised controlled trials are conducted. In this article, we discuss the challenges and issues, such as structured data curation, data preprocessing and quality, large-scale data management and complex data analysis requirements, in the data processing and analysis of real-world TCM clinical data. Furthermore, we also discuss related state-of-the-art research and solutions in China. We have shown that the clinical data warehouse based on the collection of structured electronic medical record data and clinical terminology would be a promising approach for generating clinical hypotheses and helping the discovery of clinical knowledge from large-scale real-world TCM clinical data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Traditional Chinese medicine (TCM) is a clinical-based discipline in which real-world clinical practice plays a significant role for both the development of clinical therapy and theoretical research. The large-scale clinical data generated during the daily clinical operations of TCM provide a highly valuable knowledge source for clinical decision making. Secondary analysis of these data would be a vital task for TCM clinical studies before the randomised controlled trials are conducted. In this article, we discuss the challenges and issues, such as structured data curation, data preprocessing and quality, large-scale data management and complex data analysis requirements, in the data processing and analysis of real-world TCM clinical data. Furthermore, we also discuss related state-of-the-art research and solutions in China. We have shown that the clinical data warehouse based on the collection of structured electronic medical record data and clinical terminology would be a promising approach for generating clinical hypotheses and helping the discovery of clinical knowledge from large-scale real-world TCM clinical data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4435" xmlns="http://purl.org/rss/1.0/"><title>Global hypothesis testing for high-dimensional repeated measures outcomes</title><link>http://dx.doi.org/10.1002%2Fsim.4435</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Global hypothesis testing for high-dimensional repeated measures outcomes</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yueh-Yun Chi</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Matthew Gribbin</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yvonne Lamers</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jesse F. Gregory</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Keith E. Muller</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-09T09:14:02.576858-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4435</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4435</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4435</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>High-throughput technology in metabolomics, genomics, and proteomics gives rise to high dimension, low sample size data when the number of metabolites, genes, or proteins exceeds the sample size. For a limited class of designs, the classic ‘univariate approach’ for Gaussian repeated measures can provide a reasonable global hypothesis test. We derive new tests that not only accurately allow more variables than subjects, but also give valid analyses for data with complex between-subject and within-subject designs. Our derivations capitalize on the dual of the error covariance matrix, which is nonsingular when the number of variables exceeds the sample size, to ensure correct statistical inference and enhance computational efficiency. Simulation studies demonstrate that the new tests accurately control Type I error rate and have reasonable power even with a handful of subjects and a thousand outcome variables. We apply the new methods to the study of metabolic consequences of vitamin B6 deficiency. Free software implementing the new methods applies to a wide range of designs, including one group pre-intervention and post-intervention comparisons, multiple parallel group comparisons with one-way or factorial designs, and the adjustment and evaluation of covariate effects. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>High-throughput technology in metabolomics, genomics, and proteomics gives rise to high dimension, low sample size data when the number of metabolites, genes, or proteins exceeds the sample size. For a limited class of designs, the classic ‘univariate approach’ for Gaussian repeated measures can provide a reasonable global hypothesis test. We derive new tests that not only accurately allow more variables than subjects, but also give valid analyses for data with complex between-subject and within-subject designs. Our derivations capitalize on the dual of the error covariance matrix, which is nonsingular when the number of variables exceeds the sample size, to ensure correct statistical inference and enhance computational efficiency. Simulation studies demonstrate that the new tests accurately control Type I error rate and have reasonable power even with a handful of subjects and a thousand outcome variables. We apply the new methods to the study of metabolic consequences of vitamin B6 deficiency. Free software implementing the new methods applies to a wide range of designs, including one group pre-intervention and post-intervention comparisons, multiple parallel group comparisons with one-way or factorial designs, and the adjustment and evaluation of covariate effects. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4419" xmlns="http://purl.org/rss/1.0/"><title>A Bayesian order-restricted model for hormonal dynamics during menstrual cycles of healthy women</title><link>http://dx.doi.org/10.1002%2Fsim.4419</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A Bayesian order-restricted model for hormonal dynamics during menstrual cycles of healthy women</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Anindya Roy</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Michelle Danaher</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sunni L. Mumford</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhen Chen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-07T05:44:00.818991-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4419</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4419</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4419</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>We propose a Bayesian framework for analyzing multivariate linear mixed effect models with linear constraints on the fixed effect parameters. The procedure can incorporate both firm and soft restrictions on the parameters and Bayesian model selection for the random effects. The framework is used to analyze data from the BioCycle study. One of the main objectives of the BioCycle study is to investigate the association between markers of oxidative stress and hormone levels during menstrual cycles of healthy women. Contrary to the popular belief that ovarian hormones are negatively associated with level of F <sub>2</sub>-isoprostanes, a known marker for oxidative stress, our analysis finds a positive association between ovarian hormone levels and isoprostane levels. The positive association corroborates the findings from a previous analysis of the BioCycle data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>We propose a Bayesian framework for analyzing multivariate linear mixed effect models with linear constraints on the fixed effect parameters. The procedure can incorporate both firm and soft restrictions on the parameters and Bayesian model selection for the random effects. The framework is used to analyze data from the BioCycle study. One of the main objectives of the BioCycle study is to investigate the association between markers of oxidative stress and hormone levels during menstrual cycles of healthy women. Contrary to the popular belief that ovarian hormones are negatively associated with level of F 2-isoprostanes, a known marker for oxidative stress, our analysis finds a positive association between ovarian hormone levels and isoprostane levels. The positive association corroborates the findings from a previous analysis of the BioCycle data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4418" xmlns="http://purl.org/rss/1.0/"><title>Estimating incidence rates using exact or interval-censored data with an application to hospital-acquired infections</title><link>http://dx.doi.org/10.1002%2Fsim.4418</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating incidence rates using exact or interval-censored data with an application to hospital-acquired infections</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lisha Deng</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Peter J. Diggle</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">John Cheesbrough</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-12-07T05:03:27.793046-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4418</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4418</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4418</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Health-care providers in the UK and elsewhere are required to maintain records of incidents relating to patient safety, including the date and time of each incident. However, for reporting and analysis, the resulting data are typically grouped into discrete time intervals, for example, weekly or monthly counts. The grouping represents a potential loss of information for estimating variations in incidence over time. We use a Poisson point process model to quantify this loss of information. We also suggest some diagnostic procedures for checking the goodness of fit of the Poisson model. Finally, we apply the model to the data on hospital-acquired methicillin-resistant <em>Staphylococcus aureus</em> infections in two hospitals in the north of England. We find that, in one of the hospitals, the estimated incidence decreased by a factor of approximately 2.3 over a 7-year period from 0.323 to 0.097 cases per day per 1000 beds, whereas in the other, the estimated incidence showed only a small and nonsignificant decrease over the same period from 0.137 to 0.131. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Health-care providers in the UK and elsewhere are required to maintain records of incidents relating to patient safety, including the date and time of each incident. However, for reporting and analysis, the resulting data are typically grouped into discrete time intervals, for example, weekly or monthly counts. The grouping represents a potential loss of information for estimating variations in incidence over time. We use a Poisson point process model to quantify this loss of information. We also suggest some diagnostic procedures for checking the goodness of fit of the Poisson model. Finally, we apply the model to the data on hospital-acquired methicillin-resistant Staphylococcus aureus infections in two hospitals in the north of England. We find that, in one of the hospitals, the estimated incidence decreased by a factor of approximately 2.3 over a 7-year period from 0.323 to 0.097 cases per day per 1000 beds, whereas in the other, the estimated incidence showed only a small and nonsignificant decrease over the same period from 0.137 to 0.131. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4343" xmlns="http://purl.org/rss/1.0/"><title>Comparison of alternative models for linking drug exposure with adverse effects</title><link>http://dx.doi.org/10.1002%2Fsim.4343</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Comparison of alternative models for linking drug exposure with adverse effects</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Michal Abrahamowicz</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Marie-Eve Beauchamp</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Marie-Pierre Sylvestre</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-17T06:53:42.900303-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4343</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4343</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4343</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Pharmacoepidemiology investigates associations between time-varying medication use/dose and risk of adverse events. Applied research typically relies on a priori chosen simple conventional models, such as current dose or any use in the past 3 months. However, different models imply different risk predictions, and only one model can be etiologically correct in any specific applications. We first formally defined several candidate models mapping the time vector of past drug doses (<b><em>X</em></b> (<em>t</em>), <em>t</em>  =  1, … ,<em>u</em>) into the value of a time-varying exposure metric <em>M</em>(<em>u</em>) at current time <em>u</em>. In addition to conventional one-parameter models, we considered two-parameter models accounting for recent dose increase or withdrawal and a flexible spline-based weighted cumulative exposure (WCE) model that defines <em>M</em>(<em>u</em>) as the weighted sum of past doses. In simulations, we generated event times assuming one of the models was correct and then analyzed the data with all candidate models. We demonstrated that the minimum AIC criterion is able to identify the correct model as the best-fitting model or one of the equivalent (within 4 AIC points of the minimum) models in a vast majority of simulated samples, especially with 500 or more events. We also showed how relying on an incorrect a priori chosen model may largely reduce the power to test for an association. Finally, we demonstrated how the flexible WCE estimates may help with model diagnostics even if the correct model is not WCE. We illustrated the practical advantages of AIC-based a posteriori model selection and WCE modeling in a real-life pharmacoepidemiology example. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Pharmacoepidemiology investigates associations between time-varying medication use/dose and risk of adverse events. Applied research typically relies on a priori chosen simple conventional models, such as current dose or any use in the past 3 months. However, different models imply different risk predictions, and only one model can be etiologically correct in any specific applications. We first formally defined several candidate models mapping the time vector of past drug doses (X (t), t  =  1, … ,u) into the value of a time-varying exposure metric M(u) at current time u. In addition to conventional one-parameter models, we considered two-parameter models accounting for recent dose increase or withdrawal and a flexible spline-based weighted cumulative exposure (WCE) model that defines M(u) as the weighted sum of past doses. In simulations, we generated event times assuming one of the models was correct and then analyzed the data with all candidate models. We demonstrated that the minimum AIC criterion is able to identify the correct model as the best-fitting model or one of the equivalent (within 4 AIC points of the minimum) models in a vast majority of simulated samples, especially with 500 or more events. We also showed how relying on an incorrect a priori chosen model may largely reduce the power to test for an association. Finally, we demonstrated how the flexible WCE estimates may help with model diagnostics even if the correct model is not WCE. We illustrated the practical advantages of AIC-based a posteriori model selection and WCE modeling in a real-life pharmacoepidemiology example. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4359" xmlns="http://purl.org/rss/1.0/"><title>Outcome-dependent sampling for longitudinal binary response data based on a time-varying auxiliary variable</title><link>http://dx.doi.org/10.1002%2Fsim.4359</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Outcome-dependent sampling for longitudinal binary response data based on a time-varying auxiliary variable</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jonathan S. Schildcrout</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sunni L. Mumford</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhen Chen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Patrick J. Heagerty</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Paul J. Rathouz</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-16T05:16:10.752435-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4359</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4359</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4359</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Outcome-dependent sampling (ODS) study designs are commonly implemented with rare diseases or when prospective studies are infeasible. In longitudinal data settings, when a repeatedly measured binary response is rare, an ODS design can be highly efficient for maximizing statistical information subject to resource limitations that prohibit covariate ascertainment of all observations. This manuscript details an ODS design where individual observations are sampled with probabilities determined by an inexpensive, time-varying auxiliary variable that is related but is not equal to the response. With the goal of validly estimating marginal model parameters based on the resulting biased sample, we propose a semi-parametric, <em>sequential offsetted logistic regressions</em> (SOLR) approach. The SOLR strategy first estimates the relationship between the auxiliary variable and the response and covariate data by using an offsetted logistic regression analysis where the offset is used to adjust for the biased design. Results from the auxiliary variable model are then combined with the known or estimated sampling probabilities to formulate a second offset that is used to correct for the biased design in the ultimate target model relating the longitudinal binary response to covariates. Because the target model offset is estimated with SOLR, we detail asymptotic standard error estimates that account for uncertainty associated with the auxiliary variable model. Motivated by an analysis of the BioCycle Study (Gaskins et al., Effect of daily fiber intake on reproductive function: the BioCycle Study. <em>American Journal of Clinical Nutrition</em> 2009; 90(4): 1061–1069) that aims to describe the relationship between reproductive health (determined by luteinizing hormone levels) and fiber consumption, we examine properties of SOLR estimators and compare them with other common approaches. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Outcome-dependent sampling (ODS) study designs are commonly implemented with rare diseases or when prospective studies are infeasible. In longitudinal data settings, when a repeatedly measured binary response is rare, an ODS design can be highly efficient for maximizing statistical information subject to resource limitations that prohibit covariate ascertainment of all observations. This manuscript details an ODS design where individual observations are sampled with probabilities determined by an inexpensive, time-varying auxiliary variable that is related but is not equal to the response. With the goal of validly estimating marginal model parameters based on the resulting biased sample, we propose a semi-parametric, sequential offsetted logistic regressions (SOLR) approach. The SOLR strategy first estimates the relationship between the auxiliary variable and the response and covariate data by using an offsetted logistic regression analysis where the offset is used to adjust for the biased design. Results from the auxiliary variable model are then combined with the known or estimated sampling probabilities to formulate a second offset that is used to correct for the biased design in the ultimate target model relating the longitudinal binary response to covariates. Because the target model offset is estimated with SOLR, we detail asymptotic standard error estimates that account for uncertainty associated with the auxiliary variable model. Motivated by an analysis of the BioCycle Study (Gaskins et al., Effect of daily fiber intake on reproductive function: the BioCycle Study. American Journal of Clinical Nutrition 2009; 90(4): 1061–1069) that aims to describe the relationship between reproductive health (determined by luteinizing hormone levels) and fiber consumption, we examine properties of SOLR estimators and compare them with other common approaches. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4385" xmlns="http://purl.org/rss/1.0/"><title>Interpretability and importance of functionals in competing risks and multistate models</title><link>http://dx.doi.org/10.1002%2Fsim.4385</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Interpretability and importance of functionals in competing risks and multistate models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Per Kragh Andersen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Niels Keiding</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-14T02:19:04.89522-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4385</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4385</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4385</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The basic parameters in both survival analysis and more general multistate models, including the competing risks model and the illness–death model, are the transition hazards. It is often necessary to supplement the analysis of such models with other model parameters, which are all functionals of the transition hazards. Unfortunately, not all such functionals are equally meaningful in practical contexts, even though they may be mathematically well defined. We have found it useful to check whether the functionals satisfy three simple principles, which may be used as criteria for practical interpretability. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The basic parameters in both survival analysis and more general multistate models, including the competing risks model and the illness–death model, are the transition hazards. It is often necessary to supplement the analysis of such models with other model parameters, which are all functionals of the transition hazards. Unfortunately, not all such functionals are equally meaningful in practical contexts, even though they may be mathematically well defined. We have found it useful to check whether the functionals satisfy three simple principles, which may be used as criteria for practical interpretability. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4387" xmlns="http://purl.org/rss/1.0/"><title>Towards power and sample size calculations for the comparison of two groups of patients with item response theory models</title><link>http://dx.doi.org/10.1002%2Fsim.4387</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Towards power and sample size calculations for the comparison of two groups of patients with item response theory models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jean-Benoit Hardouin</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sarah Amri</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Mohand-Larbi Feddag</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Véronique Sébille</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-08T22:46:00.669238-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4387</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4387</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4387</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Evaluation of patient-reported outcomes (PRO) is increasingly performed in health sciences. PRO differs from other measurements because such patient characteristics cannot be directly observed. Item response theory (IRT) is an attractive way for PRO analysis. However, in the framework of IRT, sample size justification is rarely provided or ignores the fact that PRO measures are latent variables with the use of formulas developed for observed variables. It might therefore be inappropriate and might provide inadequately sized studies. The objective was to develop valid sample size methodology for the comparison of PRO in two groups of patients using IRT. The proposed approach takes into account questionnaire's items parameters, the difference of the latent variables means, and its variance whose derivation is approximated using Cramer–Rao bound (CRB). We also computed the associated power. We realized a simulation study taking into account sample size, number of items, and value of the group effect. We compared power obtained from CRB with the one obtained from simulations (SIM) and with the power based on observed variables (OBS). For a given sample size, powers using CRB and SIM were similar and always lower than OBS. We observed a strong impact of the number of items for CRB and SIM, the power increasing with the questionnaire's length but not for OBS. In the context of latent variables, it seems important to use an adapted sample size formula because the formula developed for observed variables seems to be inadequate and leads to an underestimated study size. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Evaluation of patient-reported outcomes (PRO) is increasingly performed in health sciences. PRO differs from other measurements because such patient characteristics cannot be directly observed. Item response theory (IRT) is an attractive way for PRO analysis. However, in the framework of IRT, sample size justification is rarely provided or ignores the fact that PRO measures are latent variables with the use of formulas developed for observed variables. It might therefore be inappropriate and might provide inadequately sized studies. The objective was to develop valid sample size methodology for the comparison of PRO in two groups of patients using IRT. The proposed approach takes into account questionnaire's items parameters, the difference of the latent variables means, and its variance whose derivation is approximated using Cramer–Rao bound (CRB). We also computed the associated power. We realized a simulation study taking into account sample size, number of items, and value of the group effect. We compared power obtained from CRB with the one obtained from simulations (SIM) and with the power based on observed variables (OBS). For a given sample size, powers using CRB and SIM were similar and always lower than OBS. We observed a strong impact of the number of items for CRB and SIM, the power increasing with the questionnaire's length but not for OBS. In the context of latent variables, it seems important to use an adapted sample size formula because the formula developed for observed variables seems to be inadequate and leads to an underestimated study size. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4404" xmlns="http://purl.org/rss/1.0/"><title>Spatial scan statistics with overdispersion</title><link>http://dx.doi.org/10.1002%2Fsim.4404</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Spatial scan statistics with overdispersion</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Tonglin Zhang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zuoyi Zhang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ge Lin</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-03T10:49:04.903055-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4404</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4404</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4404</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The spatial scan statistic has been widely used in spatial disease surveillance and spatial cluster detection for more than a decade. However, overdispersion often presents in real-world data, causing not only violation of the Poisson assumption but also excessive type I errors or false alarms. In order to account for overdispersion, we extend the Poisson-based spatial scan test to a quasi-Poisson-based test. The simulation shows that the proposed method can substantially reduce type I error probabilities in the presence of overdispersion. In a case study of infant mortality in Jiangxi, China, both tests detect a cluster; however, a secondary cluster is identified by only the Poisson-based test. It is recommended that a cluster detected by the Poisson-based scan test should be interpreted with caution when it is not confirmed by the quasi-Poisson-based test. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The spatial scan statistic has been widely used in spatial disease surveillance and spatial cluster detection for more than a decade. However, overdispersion often presents in real-world data, causing not only violation of the Poisson assumption but also excessive type I errors or false alarms. In order to account for overdispersion, we extend the Poisson-based spatial scan test to a quasi-Poisson-based test. The simulation shows that the proposed method can substantially reduce type I error probabilities in the presence of overdispersion. In a case study of infant mortality in Jiangxi, China, both tests detect a cluster; however, a secondary cluster is identified by only the Poisson-based test. It is recommended that a cluster detected by the Poisson-based scan test should be interpreted with caution when it is not confirmed by the quasi-Poisson-based test. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4357" xmlns="http://purl.org/rss/1.0/"><title>Optimal sample sizes for phase II clinical trials and pilot studies</title><link>http://dx.doi.org/10.1002%2Fsim.4357</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Optimal sample sizes for phase II clinical trials and pilot studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Nigel Stallard</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-03T01:33:19.69895-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4357</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4357</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4357</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Methodology for sample size calculation for phase III clinical trials is well established and widely used. In contrast, for earlier phase clinical trials or pilot studies, although there is an acceptance that the methods used for phase III trials are not appropriate, there is little consensus over methods that should be used. This paper explores this problem from a Bayesian decision-theoretic perspective. The aim is to obtain sample sizes that would be appropriate for studies funded by a large funder such as a public sector body or major pharmaceutical company. The sample sizes obtained are optimal in that they minimise the average number of patients required per successfully identified effective therapy or equivalently maximise the number of effective therapies successfully identified over a long period.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>It is indicated that the number of patients included in a phase II clinical trial should be approximately 0.03 times that planned to be included in the phase III study. This is similar to that proposed by other researchers in this area, though rather smaller than actually used for many phase II trials. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Methodology for sample size calculation for phase III clinical trials is well established and widely used. In contrast, for earlier phase clinical trials or pilot studies, although there is an acceptance that the methods used for phase III trials are not appropriate, there is little consensus over methods that should be used. This paper explores this problem from a Bayesian decision-theoretic perspective. The aim is to obtain sample sizes that would be appropriate for studies funded by a large funder such as a public sector body or major pharmaceutical company. The sample sizes obtained are optimal in that they minimise the average number of patients required per successfully identified effective therapy or equivalently maximise the number of effective therapies successfully identified over a long period.It is indicated that the number of patients included in a phase II clinical trial should be approximately 0.03 times that planned to be included in the phase III study. This is similar to that proposed by other researchers in this area, though rather smaller than actually used for many phase II trials. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4389" xmlns="http://purl.org/rss/1.0/"><title>Local sparse bump hunting reveals molecular heterogeneity of colon tumors</title><link>http://dx.doi.org/10.1002%2Fsim.4389</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Local sparse bump hunting reveals molecular heterogeneity of colon tumors</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jean-Eudes Dazard</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">J. Sunil Rao</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sanford Markowitz</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-11-03T00:44:47.394118-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4389</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4389</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4389</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The question of molecular heterogeneity and of tumoral phenotype in cancer remains unresolved. To understand the underlying molecular basis of this phenomenon, we analyzed genome-wide expression data of colon cancer metastasis samples, as these tumors are the most advanced and hence would be anticipated to be the most likely heterogeneous group of tumors, potentially exhibiting the maximum amount of genetic heterogeneity. Casting a statistical net around such a complex problem proves difficult because of the high dimensionality and multicollinearity of the gene expression space, combined with the fact that genes act in concert with one another and that not all genes surveyed might be involved. We devise a strategy to identify distinct subgroups of samples and determine the genetic/molecular signature that defines them. This involves use of the local sparse bump hunting algorithm, which provides a much more optimal and biologically faithful transformed space within which to search for bumps. In addition, thanks to the variable selection feature of the algorithm, we derived a novel sparse gene expression signature, which appears to divide all colon cancer patients into two populations: a population whose expression pattern can be molecularly encompassed within the bump and an outlier population that cannot be. Although all patients within any given stage of the disease, including the metastatic group, appear clinically homogeneous, our procedure revealed two subgroups in each stage with distinct genetic/molecular profiles. We also discuss implications of such a finding in terms of early detection, diagnosis and prognosis. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The question of molecular heterogeneity and of tumoral phenotype in cancer remains unresolved. To understand the underlying molecular basis of this phenomenon, we analyzed genome-wide expression data of colon cancer metastasis samples, as these tumors are the most advanced and hence would be anticipated to be the most likely heterogeneous group of tumors, potentially exhibiting the maximum amount of genetic heterogeneity. Casting a statistical net around such a complex problem proves difficult because of the high dimensionality and multicollinearity of the gene expression space, combined with the fact that genes act in concert with one another and that not all genes surveyed might be involved. We devise a strategy to identify distinct subgroups of samples and determine the genetic/molecular signature that defines them. This involves use of the local sparse bump hunting algorithm, which provides a much more optimal and biologically faithful transformed space within which to search for bumps. In addition, thanks to the variable selection feature of the algorithm, we derived a novel sparse gene expression signature, which appears to divide all colon cancer patients into two populations: a population whose expression pattern can be molecularly encompassed within the bump and an outlier population that cannot be. Although all patients within any given stage of the disease, including the metastatic group, appear clinically homogeneous, our procedure revealed two subgroups in each stage with distinct genetic/molecular profiles. We also discuss implications of such a finding in terms of early detection, diagnosis and prognosis. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4371" xmlns="http://purl.org/rss/1.0/"><title>An evaluation of penalised survival methods for developing prognostic models with rare events</title><link>http://dx.doi.org/10.1002%2Fsim.4371</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">An evaluation of penalised survival methods for developing prognostic models with rare events</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">G. Ambler</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">S. Seaman</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">R. Z. Omar</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-14T01:11:37.529569-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4371</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4371</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4371</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Prognostic models for survival outcomes are often developed by fitting standard survival regression models, such as the Cox proportional hazards model, to representative datasets. However, these models can be unreliable if the datasets contain few events, which may be the case if either the disease or the event of interest is rare. Specific problems include predictions that are too extreme, and poor discrimination between low-risk and high-risk patients. The objective of this paper is to evaluate three existing penalised methods that have been proposed to improve predictive accuracy. In particular, ridge, lasso and the garotte, which use penalised maximum likelihood to shrink coefficient estimates and in some cases omit predictors entirely, are assessed using simulated data derived from two clinical datasets. The predictions obtained using these methods are compared with those from Cox models fitted using standard maximum likelihood. The simulation results suggest that Cox models fitted using maximum likelihood can perform poorly when there are few events, and that significant improvements are possible by taking a penalised modelling approach. The ridge method generally performed the best, although lasso is recommended if variable selection is required. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Prognostic models for survival outcomes are often developed by fitting standard survival regression models, such as the Cox proportional hazards model, to representative datasets. However, these models can be unreliable if the datasets contain few events, which may be the case if either the disease or the event of interest is rare. Specific problems include predictions that are too extreme, and poor discrimination between low-risk and high-risk patients. The objective of this paper is to evaluate three existing penalised methods that have been proposed to improve predictive accuracy. In particular, ridge, lasso and the garotte, which use penalised maximum likelihood to shrink coefficient estimates and in some cases omit predictors entirely, are assessed using simulated data derived from two clinical datasets. The predictions obtained using these methods are compared with those from Cox models fitted using standard maximum likelihood. The simulation results suggest that Cox models fitted using maximum likelihood can perform poorly when there are few events, and that significant improvements are possible by taking a penalised modelling approach. The ridge method generally performed the best, although lasso is recommended if variable selection is required. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4370" xmlns="http://purl.org/rss/1.0/"><title>A two-stage mixed-effects model approach for gene-set analyses in candidate gene studies</title><link>http://dx.doi.org/10.1002%2Fsim.4370</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A two-stage mixed-effects model approach for gene-set analyses in candidate gene studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Roula Tsonaka</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Annette H. M. Helm-van Mil</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jeanine J. Houwing-Duistermaat</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-14T01:11:04.791036-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4370</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4370</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4370</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In genetic association studies, a gene-set analysis can be more powerful than the separate analyses of multiple genetic variants and can offer unique insights into the genetic basis of many common human diseases. The goal of such an analysis is to study the joint effect of multiple single-nucleotide polymorphisms (SNPs) which belong to certain genes, and these genes are assumed to be involved in a common biological function. Currently, few approaches acknowledge the within-genes and between-genes correlations when testing for gene-set effects. Thus, here we propose a two-stage approach, which in the first stage uses a mixed-effects model with a general random-effects structure to capture the correlation between the SNPs and in the second stage tests for gene-set effects by using the empirical Bayes estimates of the random effects of the first stage as covariates in the model for the longitudinal phenotype. The advantage of this approach is its broad applicability because it can be used for any phenotypic outcome and any genetic model and can be implemented with standard statistical software. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In genetic association studies, a gene-set analysis can be more powerful than the separate analyses of multiple genetic variants and can offer unique insights into the genetic basis of many common human diseases. The goal of such an analysis is to study the joint effect of multiple single-nucleotide polymorphisms (SNPs) which belong to certain genes, and these genes are assumed to be involved in a common biological function. Currently, few approaches acknowledge the within-genes and between-genes correlations when testing for gene-set effects. Thus, here we propose a two-stage approach, which in the first stage uses a mixed-effects model with a general random-effects structure to capture the correlation between the SNPs and in the second stage tests for gene-set effects by using the empirical Bayes estimates of the random effects of the first stage as covariates in the model for the longitudinal phenotype. The advantage of this approach is its broad applicability because it can be used for any phenotypic outcome and any genetic model and can be implemented with standard statistical software. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4391" xmlns="http://purl.org/rss/1.0/"><title>Estimating the number of true discoveries in genome-wide association studies</title><link>http://dx.doi.org/10.1002%2Fsim.4391</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating the number of true discoveries in genome-wide association studies</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Woojoo Lee</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">A. Gusnanto</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">A. Salim</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">P. Magnusson</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xueling Sim</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">E.S. Tai</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Y. Pawitan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-11T03:22:55.368058-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4391</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4391</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4391</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Recent genome-wide association studies have reported the discoveries of genetic variants of small to moderate effects. However, most studies of complex diseases face a great challenge because the number of significant variants is less than what is required to explain the disease heritability. A new approach is needed to recognize all potential discoveries in the data. In this paper, we present a practical model-free procedure to estimate the number of true discoveries as a function of the number of top-ranking SNPs together with the confidence bounds. This approach allows a practical methodology of general utility and produces relevant statistical quantities with simple interpretation. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Recent genome-wide association studies have reported the discoveries of genetic variants of small to moderate effects. However, most studies of complex diseases face a great challenge because the number of significant variants is less than what is required to explain the disease heritability. A new approach is needed to recognize all potential discoveries in the data. In this paper, we present a practical model-free procedure to estimate the number of true discoveries as a function of the number of top-ranking SNPs together with the confidence bounds. This approach allows a practical methodology of general utility and produces relevant statistical quantities with simple interpretation. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4354" xmlns="http://purl.org/rss/1.0/"><title>Sensitivity analysis for interactions under unmeasured confounding</title><link>http://dx.doi.org/10.1002%2Fsim.4354</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Sensitivity analysis for interactions under unmeasured confounding</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Tyler J. VanderWeele</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Bhramar Mukherjee</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jinbo Chen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-04T06:29:43.307466-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4354</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4354</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4354</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>We develop a sensitivity analysis technique to assess the sensitivity of interaction analyses to unmeasured confounding. We give bias formulas for sensitivity analysis for interaction under unmeasured confounding on both additive and multiplicative scales. We provide simplified formulas in the case in which either one of the two factors does not interact with the unmeasured confounder in its effects on the outcome. An interesting consequence of the results is that if the two exposures of interest are independent (e.g., gene–environment independence), even under unmeasured confounding, if the estimate of the interaction is nonzero, then either there is a true interaction between the two factors or there is an interaction between one of the factors and the unmeasured confounder; an interaction must be present in either scenario. We apply the results to two examples drawn from the literature. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>We develop a sensitivity analysis technique to assess the sensitivity of interaction analyses to unmeasured confounding. We give bias formulas for sensitivity analysis for interaction under unmeasured confounding on both additive and multiplicative scales. We provide simplified formulas in the case in which either one of the two factors does not interact with the unmeasured confounder in its effects on the outcome. An interesting consequence of the results is that if the two exposures of interest are independent (e.g., gene–environment independence), even under unmeasured confounding, if the estimate of the interaction is nonzero, then either there is a true interaction between the two factors or there is an interaction between one of the factors and the unmeasured confounder; an interaction must be present in either scenario. We apply the results to two examples drawn from the literature. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4386" xmlns="http://purl.org/rss/1.0/"><title>Non-compartmental estimation of pharmacokinetic parameters for flexible sampling designs</title><link>http://dx.doi.org/10.1002%2Fsim.4386</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Non-compartmental estimation of pharmacokinetic parameters for flexible sampling designs</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Thomas Jaki</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Martin J. Wolfsegger</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-03T07:24:30.370382-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4386</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4386</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4386</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Pharmacokinetic (PK) studies aim to understand the kinetics of absorption, distribution, metabolism and elimination of a drug. Typically, such studies involve measuring the concentration of the drug in the plasma or blood at several time points after drug administration. In studying the PK behaviour, either the non-compartmental approach or alternatively a modelling approach can be utilized. Traditionally, the non-compartmental approach makes minimal assumptions about the data-generating process but requires the data to be collected in a very structured way. Conversely, the modelling approach depends heavily on assumptions about the data-generating process but does not impose a specific data structure. In this paper, we will discuss non-compartmental methods for estimating the area under the concentration versus time curve and other common PK parameters that use minimal assumptions about the data structure making it applicable to a wide range of PK studies. We will evaluate the methods using simulation and give an illustrative example. Copycenter © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Pharmacokinetic (PK) studies aim to understand the kinetics of absorption, distribution, metabolism and elimination of a drug. Typically, such studies involve measuring the concentration of the drug in the plasma or blood at several time points after drug administration. In studying the PK behaviour, either the non-compartmental approach or alternatively a modelling approach can be utilized. Traditionally, the non-compartmental approach makes minimal assumptions about the data-generating process but requires the data to be collected in a very structured way. Conversely, the modelling approach depends heavily on assumptions about the data-generating process but does not impose a specific data structure. In this paper, we will discuss non-compartmental methods for estimating the area under the concentration versus time curve and other common PK parameters that use minimal assumptions about the data structure making it applicable to a wide range of PK studies. We will evaluate the methods using simulation and give an illustrative example. Copycenter © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4390" xmlns="http://purl.org/rss/1.0/"><title>Design evaluation and optimisation in crossover pharmacokinetic studies analysed by nonlinear mixed effects models</title><link>http://dx.doi.org/10.1002%2Fsim.4390</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Design evaluation and optimisation in crossover pharmacokinetic studies analysed by nonlinear mixed effects models</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Thu Thuy Nguyen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Caroline Bazzoli</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">France Mentré</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-03T02:31:25.273375-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4390</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4390</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4390</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Bioequivalence or interaction trials are commonly studied in crossover design and can be analysed by nonlinear mixed effects models as an alternative to noncompartmental approach. We propose an extension of the population Fisher information matrix in nonlinear mixed effects models to design crossover pharmacokinetic trials, using a linearisation of the model around the random effect expectation, including within-subject variability and discrete covariates fixed or changing between periods. We use the expected standard errors of treatment effect to compute the power for the Wald test of comparison or equivalence and the number of subjects needed for a given power. We perform various simulations mimicking crossover two-period trials to show the relevance of these developments. We then apply these developments to design a crossover pharmacokinetic study of amoxicillin in piglets and implement them in the new version 3.2 of the <span class="smallCaps">r</span> function PFIM. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Bioequivalence or interaction trials are commonly studied in crossover design and can be analysed by nonlinear mixed effects models as an alternative to noncompartmental approach. We propose an extension of the population Fisher information matrix in nonlinear mixed effects models to design crossover pharmacokinetic trials, using a linearisation of the model around the random effect expectation, including within-subject variability and discrete covariates fixed or changing between periods. We use the expected standard errors of treatment effect to compute the power for the Wald test of comparison or equivalence and the number of subjects needed for a given power. We perform various simulations mimicking crossover two-period trials to show the relevance of these developments. We then apply these developments to design a crossover pharmacokinetic study of amoxicillin in piglets and implement them in the new version 3.2 of the r function PFIM. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4335" xmlns="http://purl.org/rss/1.0/"><title>Syndrome evaluation in traditional Chinese medicine using second-order latent variable model</title><link>http://dx.doi.org/10.1002%2Fsim.4335</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Syndrome evaluation in traditional Chinese medicine using second-order latent variable model</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yang Li</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Danhui Yi</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Huiyun Zhang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yichen Qin</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-10-03T02:05:32.34146-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4335</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4335</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4335</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">00</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">00</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The syndrome is one of the most important concepts and ingredients in the theoretical and clinical research of traditional Chinese medicine (TCM). TCM doctors believe that all diseases are caused by an imbalance in the patient's body, which is called syndrome. All the therapies and formulas in TCM are decided according to the patients' syndrome situation. To quantitatively evaluate the level of syndrome, many statistical methodologies have been discussed in recent years. In this article, we introduce a second-order latent variable model to evaluate the level of patients' syndrome with many clinical symptoms. An objective evaluation score can be easily derived by the proposed model, with a high speed of convergence and without joint-distribution assumption. We illustrate the application of this model by an analysis of premenstrual disorder syndrome of liver-qi invasion syndrome evaluation research. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The syndrome is one of the most important concepts and ingredients in the theoretical and clinical research of traditional Chinese medicine (TCM). TCM doctors believe that all diseases are caused by an imbalance in the patient's body, which is called syndrome. All the therapies and formulas in TCM are decided according to the patients' syndrome situation. To quantitatively evaluate the level of syndrome, many statistical methodologies have been discussed in recent years. In this article, we introduce a second-order latent variable model to evaluate the level of patients' syndrome with many clinical symptoms. An objective evaluation score can be easily derived by the proposed model, with a high speed of convergence and without joint-distribution assumption. We illustrate the application of this model by an analysis of premenstrual disorder syndrome of liver-qi invasion syndrome evaluation research. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4384" xmlns="http://purl.org/rss/1.0/"><title>Competing risks and the clinical community: irrelevance or ignorance?</title><link>http://dx.doi.org/10.1002%2Fsim.4384</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Competing risks and the clinical community: irrelevance or ignorance?</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Michael T. Koller</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Heike Raatz</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ewout W. Steyerberg</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Marcel Wolbers</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-23T05:08:12.62811-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4384</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4384</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4384</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Life expectancy has dramatically increased in industrialized nations over the last 200 hundred years. The aging of populations carries over to clinical research and leads to an increasing representation of elderly and multimorbid individuals in study populations. Clinical research in these populations is complicated by the fact that individuals are likely to experience several potential disease endpoints that prevent some disease-specific endpoint of interest from occurrence. Large developments in competing risks methodology have been achieved over the last decades, but we assume that recognition of competing risks in the clinical community is still marginal. It is the aim of this article to address translational aspects of competing risks to the clinical community. We describe clinical populations where competing risks issues may arise. We then discuss the importance of agreement between the competing risks methodology and the study aim, in particular the distinction between etiologic and prognostic research questions. In a review of 50 clinical studies performed in individuals susceptible to competing risks published in high-impact clinical journals, we found competing risks issues in 70% of all articles. Better recognition of issues related to competing risks and of statistical methods that deal with competing risks in accordance with the aim of the study is needed. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Life expectancy has dramatically increased in industrialized nations over the last 200 hundred years. The aging of populations carries over to clinical research and leads to an increasing representation of elderly and multimorbid individuals in study populations. Clinical research in these populations is complicated by the fact that individuals are likely to experience several potential disease endpoints that prevent some disease-specific endpoint of interest from occurrence. Large developments in competing risks methodology have been achieved over the last decades, but we assume that recognition of competing risks in the clinical community is still marginal. It is the aim of this article to address translational aspects of competing risks to the clinical community. We describe clinical populations where competing risks issues may arise. We then discuss the importance of agreement between the competing risks methodology and the study aim, in particular the distinction between etiologic and prognostic research questions. In a review of 50 clinical studies performed in individuals susceptible to competing risks published in high-impact clinical journals, we found competing risks issues in 70% of all articles. Better recognition of issues related to competing risks and of statistical methods that deal with competing risks in accordance with the aim of the study is needed. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4367" xmlns="http://purl.org/rss/1.0/"><title>Logistic regression analysis of biomarker data subject to pooling and dichotomization</title><link>http://dx.doi.org/10.1002%2Fsim.4367</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Logistic regression analysis of biomarker data subject to pooling and dichotomization</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Z. Zhang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">A. Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">R.H.  Lyles</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">B. Mukherjee</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-23T05:08:06.127808-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4367</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4367</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4367</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>There is growing interest in pooling specimens across subjects in epidemiologic studies, especially those involving biomarkers. This paper is concerned with regression analysis of epidemiologic data where a binary exposure is subject to pooling and the pooled measurement is dichotomized to indicate either that no subjects in the pool are exposed or that some are exposed, without revealing further information about the exposed subjects in the latter case. The pooling process may be stratified on the disease status (a binary outcome) and possibly other variables but is otherwise assumed random. We propose methods for estimating parameters in a prospective logistic regression model and illustrate these with data from a population-based case-control study of colorectal cancer. Simulation results show that the proposed methods perform reasonably well in realistic settings and that pooling can lead to sizable gains in cost efficiency. We make recommendations with regard to the choice of design for pooled epidemiologic studies. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>There is growing interest in pooling specimens across subjects in epidemiologic studies, especially those involving biomarkers. This paper is concerned with regression analysis of epidemiologic data where a binary exposure is subject to pooling and the pooled measurement is dichotomized to indicate either that no subjects in the pool are exposed or that some are exposed, without revealing further information about the exposed subjects in the latter case. The pooling process may be stratified on the disease status (a binary outcome) and possibly other variables but is otherwise assumed random. We propose methods for estimating parameters in a prospective logistic regression model and illustrate these with data from a population-based case-control study of colorectal cancer. Simulation results show that the proposed methods perform reasonably well in realistic settings and that pooling can lead to sizable gains in cost efficiency. We make recommendations with regard to the choice of design for pooled epidemiologic studies. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4369" xmlns="http://purl.org/rss/1.0/"><title>Optimum threshold estimation based on cost function in a multistate diagnostic setting</title><link>http://dx.doi.org/10.1002%2Fsim.4369</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Optimum threshold estimation based on cost function in a multistate diagnostic setting</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Konstantina Skaltsa</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lluís Jover</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">David Fuster</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Josep Lluís Carrasco</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-21T10:59:32.430348-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4369</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4369</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4369</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In the diagnostic area, the usual setting considers two populations: nondiseased and diseased. The use of the standard ROC analysis methodology is well established. Sometimes, however, diagnostic problems inherently include more than two classification states. For example, ‘yes, uncertain, no’ or ‘low, normal, high’. Here we consider a three-normal distribution setting and derive estimators for the optimum thresholds between states based on a cost function. These estimators can be extended for clinical contexts with more than three states. This approach is well known for the two-state setting and its advantage lies in the fact that it accounts for the specific context's properties, such as disease prevalence and classification costs. Here we calculated the variance of the estimators by the use of parametric methods on nonlinear equations and we constructed confidence intervals accounting for possible uncertainty in the threshold estimation. We conducted a simulation study to assess the performance of these estimators and the confidence intervals. Comparisons with the naive threshold estimation method of joining the distributions two-by-two and applying standard ROC techniques proved that the latter method is not reliable for all parameter combinations and should be avoided. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In the diagnostic area, the usual setting considers two populations: nondiseased and diseased. The use of the standard ROC analysis methodology is well established. Sometimes, however, diagnostic problems inherently include more than two classification states. For example, ‘yes, uncertain, no’ or ‘low, normal, high’. Here we consider a three-normal distribution setting and derive estimators for the optimum thresholds between states based on a cost function. These estimators can be extended for clinical contexts with more than three states. This approach is well known for the two-state setting and its advantage lies in the fact that it accounts for the specific context's properties, such as disease prevalence and classification costs. Here we calculated the variance of the estimators by the use of parametric methods on nonlinear equations and we constructed confidence intervals accounting for possible uncertainty in the threshold estimation. We conducted a simulation study to assess the performance of these estimators and the confidence intervals. Comparisons with the naive threshold estimation method of joining the distributions two-by-two and applying standard ROC techniques proved that the latter method is not reliable for all parameter combinations and should be avoided. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4345" xmlns="http://purl.org/rss/1.0/"><title>Considerations on what constitutes a ‘qualified statistician’ in regulatory guidelines</title><link>http://dx.doi.org/10.1002%2Fsim.4345</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Considerations on what constitutes a ‘qualified statistician’ in regulatory guidelines</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Christoph Gerlinger</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lutz Edler</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Tim Friede</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Meinhard Kieser</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Christos T Nakas</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Martin Schumacher</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jørgen Seldrup</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Norbert Victor</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-21T10:57:58.807682-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4345</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4345</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4345</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>International regulatory guidelines require that a ‘qualified statistician’ takes responsibility for the statistical aspects of a clinical trial used for drug licensing. No consensus on what constitutes a ‘qualified statistician’ appears to have been developed so far.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>The International Society for Clinical Biostatistics is issuing this reflection paper in order to stimulate a discussion on the concept. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>International regulatory guidelines require that a ‘qualified statistician’ takes responsibility for the statistical aspects of a clinical trial used for drug licensing. No consensus on what constitutes a ‘qualified statistician’ appears to have been developed so far.The International Society for Clinical Biostatistics is issuing this reflection paper in order to stimulate a discussion on the concept. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4363" xmlns="http://purl.org/rss/1.0/"><title>Bayesian adaptive clinical trials: a dream for statisticians only?</title><link>http://dx.doi.org/10.1002%2Fsim.4363</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Bayesian adaptive clinical trials: a dream for statisticians only?</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Sylvie Chevret</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-09T04:55:35.425348-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4363</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4363</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4363</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>Adaptive or ‘flexible’ designs have emerged, mostly within frequentist frameworks, as an effective way to speed up the therapeutic evaluation process. Because of their flexibility, Bayesian methods have also been proposed for Phase I through Phase III adaptive trials; however, it has been reported that they are poorly used in practice. We aim to describe the international scientific production of Bayesian clinical trials by investigating the actual development and use of Bayesian ‘adaptive’ methods in the setting of clinical trials. A bibliometric study was conducted using the PubMed and Science Citation Index-Expanded databases. Most of the references found were biostatistical papers from various teams around the world. Most of the authors were from the US, and a large proportion was from the MD Anderson Cancer Center (University of Texas, Houston, TX). The spread and use of these articles depended heavily on their topic, with 3.1% of the biostatistical articles accumulating at least 25 citations within 5 years of their publication compared with 15% of the reviews and 32% of the clinical articles. We also examined the reasons for the limited use of Bayesian adaptive design methods in clinical trials and the areas of current and future research to address these challenges. Efforts to promote Bayesian approaches among statisticians and clinicians appear necessary. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Adaptive or ‘flexible’ designs have emerged, mostly within frequentist frameworks, as an effective way to speed up the therapeutic evaluation process. Because of their flexibility, Bayesian methods have also been proposed for Phase I through Phase III adaptive trials; however, it has been reported that they are poorly used in practice. We aim to describe the international scientific production of Bayesian clinical trials by investigating the actual development and use of Bayesian ‘adaptive’ methods in the setting of clinical trials. A bibliometric study was conducted using the PubMed and Science Citation Index-Expanded databases. Most of the references found were biostatistical papers from various teams around the world. Most of the authors were from the US, and a large proportion was from the MD Anderson Cancer Center (University of Texas, Houston, TX). The spread and use of these articles depended heavily on their topic, with 3.1% of the biostatistical articles accumulating at least 25 citations within 5 years of their publication compared with 15% of the reviews and 32% of the clinical articles. We also examined the reasons for the limited use of Bayesian adaptive design methods in clinical trials and the areas of current and future research to address these challenges. Efforts to promote Bayesian approaches among statisticians and clinicians appear necessary. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4356" xmlns="http://purl.org/rss/1.0/"><title>Identifying influential observations in Bayesian models by using Markov chain Monte Carlo</title><link>http://dx.doi.org/10.1002%2Fsim.4356</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Identifying influential observations in Bayesian models by using Markov chain Monte Carlo</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Dan Jackson</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ian R. White</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">James Carpenter</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-09-08T06:53:52.212988-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4356</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4356</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4356</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>In statistical modelling, it is often important to know how much parameter estimates are influenced by particular observations. An attractive approach is to re-estimate the parameters with each observation deleted in turn, but this is computationally demanding when fitting models by using Markov chain Monte Carlo (MCMC), as obtaining complete sample estimates is often in itself a very time-consuming task. Here we propose two efficient ways to approximate the case-deleted estimates by using output from MCMC estimation. Our first proposal, which directly approximates the usual influence statistics in maximum likelihood analyses of generalised linear models (GLMs), is easy to implement and avoids any further evaluation of the likelihood. Hence, unlike the existing alternatives, it does not become more computationally intensive as the model complexity increases. Our second proposal, which utilises model perturbations, also has this advantage and does not require the form of the GLM to be specified. We show how our two proposed methods are related and evaluate them against the existing method of importance sampling and case deletion in a logistic regression analysis with missing covariates. We also provide practical advice for those implementing our procedures, so that they may be used in many situations where MCMC is used to fit statistical models. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In statistical modelling, it is often important to know how much parameter estimates are influenced by particular observations. An attractive approach is to re-estimate the parameters with each observation deleted in turn, but this is computationally demanding when fitting models by using Markov chain Monte Carlo (MCMC), as obtaining complete sample estimates is often in itself a very time-consuming task. Here we propose two efficient ways to approximate the case-deleted estimates by using output from MCMC estimation. Our first proposal, which directly approximates the usual influence statistics in maximum likelihood analyses of generalised linear models (GLMs), is easy to implement and avoids any further evaluation of the likelihood. Hence, unlike the existing alternatives, it does not become more computationally intensive as the model complexity increases. Our second proposal, which utilises model perturbations, also has this advantage and does not require the form of the GLM to be specified. We show how our two proposed methods are related and evaluate them against the existing method of importance sampling and case deletion in a logistic regression analysis with missing covariates. We also provide practical advice for those implementing our procedures, so that they may be used in many situations where MCMC is used to fit statistical models. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4304" xmlns="http://purl.org/rss/1.0/"><title>Estimation and testing based on data subject to measurement errors: from parametric to non-parametric likelihood methods</title><link>http://dx.doi.org/10.1002%2Fsim.4304</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimation and testing based on data subject to measurement errors: from parametric to non-parametric likelihood methods</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Albert Vexler</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Wan-Min Tsai</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yaakov Malinovsky</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-07-29T06:53:20.091399-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4304</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4304</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4304</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Measurement error (ME) problems can cause bias or inconsistency of statistical inferences. When investigators are unable to obtain correct measurements of biological assays, special techniques to quantify MEs need to be applied. Sampling based on repeated measurements is a common strategy to allow for ME. This method has been well addressed in the literature under parametric assumptions. The approach with repeated measures data may not be applicable when the replications are complicated because of cost and/or time concerns. Pooling designs have been proposed as cost-efficient sampling procedures that can assist to provide correct statistical operations based on data subject to ME. We demonstrate that a mixture of both pooled and unpooled data (a hybrid pooled–unpooled design) can support very efficient estimation and testing in the presence of ME. Nonparametric techniques have not been well investigated to analyze repeated measures data or pooled data subject to ME. We propose and examine both the parametric and empirical likelihood methodologies for data subject to ME. We conclude that the likelihood methods based on the hybrid samples are very efficient and powerful. The results of an extensive Monte Carlo study support our conclusions. Real data examples demonstrate the efficiency of the proposed methods in practice. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Measurement error (ME) problems can cause bias or inconsistency of statistical inferences. When investigators are unable to obtain correct measurements of biological assays, special techniques to quantify MEs need to be applied. Sampling based on repeated measurements is a common strategy to allow for ME. This method has been well addressed in the literature under parametric assumptions. The approach with repeated measures data may not be applicable when the replications are complicated because of cost and/or time concerns. Pooling designs have been proposed as cost-efficient sampling procedures that can assist to provide correct statistical operations based on data subject to ME. We demonstrate that a mixture of both pooled and unpooled data (a hybrid pooled–unpooled design) can support very efficient estimation and testing in the presence of ME. Nonparametric techniques have not been well investigated to analyze repeated measures data or pooled data subject to ME. We propose and examine both the parametric and empirical likelihood methodologies for data subject to ME. We conclude that the likelihood methods based on the hybrid samples are very efficient and powerful. The results of an extensive Monte Carlo study support our conclusions. Real data examples demonstrate the efficiency of the proposed methods in practice. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4275" xmlns="http://purl.org/rss/1.0/"><title>Random effects models for assessing diagnostic accuracy of traditional Chinese doctors in absence of a gold standard</title><link>http://dx.doi.org/10.1002%2Fsim.4275</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Random effects models for assessing diagnostic accuracy of traditional Chinese doctors in absence of a gold standard</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zheyu Wang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xiao-Hua Zhou</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-05-31T01:54:36.874914-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4275</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4275</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4275</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>Two common problems in assessing the accuracy of traditional Chinese medicine (TCM) doctors in detecting a particular symptom are the unknown true symptom status and the ordinal-scale of the symptom status. Wang <em>et al.</em> (<em>Biostatistics</em> 2011; DOI: <a class="accessionId" href="http://dx.doi.org/10.1093/biostatistics/kxq075" title="Link to external resource: 10.1093/biostatistics/kxq075">10.1093/biostatistics/kxq075</a>) proposed a nonparametric maximum likelihood method for estimating the accuracy of different TCM doctors without a gold standard when the true symptom status is measured on an ordinal-scale. A key assumption of their work is that the diagnosis results are independent conditional on the gold standard. This assumption can be violated in many practical situations. In this paper, we propose a random effects modeling approach that extends their method to incorporate dependence structure among different tests or doctors. The proposed method is illustrated on a real data set from TCM, which contains the diagnostic results from five doctors for the same patients regarding symptoms related to Chills disease. The same data set was analyzed by Wang <em>et al.</em> under the conditional independence assumption. In addition, we also discuss an <em>ad hoc</em> test for the model fitting and a likelihood ratio test on the random effects. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Two common problems in assessing the accuracy of traditional Chinese medicine (TCM) doctors in detecting a particular symptom are the unknown true symptom status and the ordinal-scale of the symptom status. Wang et al. (Biostatistics 2011; DOI: 10.1093/biostatistics/kxq075) proposed a nonparametric maximum likelihood method for estimating the accuracy of different TCM doctors without a gold standard when the true symptom status is measured on an ordinal-scale. A key assumption of their work is that the diagnosis results are independent conditional on the gold standard. This assumption can be violated in many practical situations. In this paper, we propose a random effects modeling approach that extends their method to incorporate dependence structure among different tests or doctors. The proposed method is illustrated on a real data set from TCM, which contains the diagnostic results from five doctors for the same patients regarding symptoms related to Chills disease. The same data set was analyzed by Wang et al. under the conditional independence assumption. In addition, we also discuss an ad hoc test for the model fitting and a likelihood ratio test on the random effects. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4242" xmlns="http://purl.org/rss/1.0/"><title>A simulation study of predictive ability measures in a survival model I: Explained variation measures</title><link>http://dx.doi.org/10.1002%2Fsim.4242</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">A simulation study of predictive ability measures in a survival model I: Explained variation measures</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Babak Choodari-Oskooei</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Patrick Royston</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Mahesh K. B. Parmar</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-04-26T05:45:49.093556-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4242</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4242</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4242</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>Measures of predictive ability play an important role in quantifying the clinical significance of prognostic factors. Several measures have been proposed to evaluate the predictive ability of survival models in the last two decades, but no single measure is consistently used. The proposed measures can be classified into the following categories: explained variation, explained randomness, and predictive accuracy. The three categories are conceptually different and are based on different principles. Several new measures have been proposed since Schemper and Stare's study in 1996 on some of the existing measures. This paper is the first of two papers that study the proposed measures systematically by applying a set of criteria that a measure of predictive ability should possess in the context of survival analysis. The present paper focuses on the explained variation category, and part II studies the proposed measures in the other categories. Simulation studies are used to examine the performance of five explained variation measures with respect to these criteria, discussing their strengths and shortcomings. Our simulation studies show that the measures proposed by Kent and O'Quigley, <b><em>R</em></b><span><img alt="math image" src="http://onlinelibrary.wiley.com/store/10.1002/sim.4242/asset/equation/tex2gif-stack-1.gif?v=1&amp;t=gynklhgo&amp;s=029c48a565dd579fc5efc7e27ec465b5022c63ba" class="inlineGraphic"/></span>, and Royston and Sauerbrei, <b><em>R</em></b><span><img alt="math image" src="http://onlinelibrary.wiley.com/store/10.1002/sim.4242/asset/equation/tex2gif-stack-2.gif?v=1&amp;t=gynklhgq&amp;s=171b2a92bbd6fffd7f5c1e7c87ffa6072aab1e58" class="inlineGraphic"/></span>, appear to be the best overall at quantifying predictive ability. However, it should be noted that neither measure is perfect; <b><em>R</em></b><span><img alt="math image" src="http://onlinelibrary.wiley.com/store/10.1002/sim.4242/asset/equation/tex2gif-stack-3.gif?v=1&amp;t=gynklhgs&amp;s=a8524db304da161fafc9e976ed4714e31de679f8" class="inlineGraphic"/></span> is sensitive to outliers and <b><em>R</em></b><span><img alt="math image" src="http://onlinelibrary.wiley.com/store/10.1002/sim.4242/asset/equation/tex2gif-stack-4.gif?v=1&amp;t=gynklhgt&amp;s=c70ed3650f934ea7df9c8a65caf45ec925167dc3" class="inlineGraphic"/></span> to (marked) non-normality of the distribution of the prognostic index. The results show that the other measures perform poorly, primarily because they are adversely affected by censoring. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Measures of predictive ability play an important role in quantifying the clinical significance of prognostic factors. Several measures have been proposed to evaluate the predictive ability of survival models in the last two decades, but no single measure is consistently used. The proposed measures can be classified into the following categories: explained variation, explained randomness, and predictive accuracy. The three categories are conceptually different and are based on different principles. Several new measures have been proposed since Schemper and Stare's study in 1996 on some of the existing measures. This paper is the first of two papers that study the proposed measures systematically by applying a set of criteria that a measure of predictive ability should possess in the context of survival analysis. The present paper focuses on the explained variation category, and part II studies the proposed measures in the other categories. Simulation studies are used to examine the performance of five explained variation measures with respect to these criteria, discussing their strengths and shortcomings. Our simulation studies show that the measures proposed by Kent and O'Quigley, R PM2, and Royston and Sauerbrei, R D2, appear to be the best overall at quantifying predictive ability. However, it should be noted that neither measure is perfect; R PM2 is sensitive to outliers and R D2 to (marked) non-normality of the distribution of the prognostic index. The results show that the other measures perform poorly, primarily because they are adversely affected by censoring. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4146" xmlns="http://purl.org/rss/1.0/"><title>Discovering herbal functional groups of traditional Chinese medicine</title><link>http://dx.doi.org/10.1002%2Fsim.4146</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Discovering herbal functional groups of traditional Chinese medicine</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ping He</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ke Deng</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhihai Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Delin Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Jun S. Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhi Geng</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-03-17T05:17:04.98299-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4146</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4146</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4146</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>For the traditional Chinese medicine (TCM), a prescription for a patient often contains several herbs. Some herbs are often used together in prescriptions, and these herbs can be considered as a functional group. In this paper, we propose an approach for discovering herbal functional groups from a large set of prescriptions recorded in TCM books. These functional groups are allowed to overlap with each other. Our approach is validated with a simulation study and applied to a data set containing thousands of TCM prescriptions. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>For the traditional Chinese medicine (TCM), a prescription for a patient often contains several herbs. Some herbs are often used together in prescriptions, and these herbs can be considered as a functional group. In this paper, we propose an approach for discovering herbal functional groups from a large set of prescriptions recorded in TCM books. These functional groups are allowed to overlap with each other. Our approach is validated with a simulation study and applied to a data set containing thousands of TCM prescriptions. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4168" xmlns="http://purl.org/rss/1.0/"><title>Generalized propensity score for estimating the average treatment effect of multiple treatments</title><link>http://dx.doi.org/10.1002%2Fsim.4168</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Generalized propensity score for estimating the average treatment effect of multiple treatments</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ping Feng</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xiao-Hua Zhou</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Qing-Ming Zou</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ming-Yu Fan</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xiao-Song Li</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-02-24T03:50:02.281042-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4168</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4168</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4168</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>The propensity score method is widely used in clinical studies to estimate the effect of a treatment with two levels on patient's outcomes. However, due to the complexity of many diseases, an effective treatment often involves multiple components. For example, in the practice of Traditional Chinese Medicine (TCM), an effective treatment may include multiple components, e.g. Chinese herbs, acupuncture, and massage therapy. In clinical trials involving TCM, patients could be randomly assigned to either the treatment or control group, but they or their doctors may make different choices about which treatment component to use. As a result, treatment components are not randomly assigned. Rosenbaum and Rubin proposed the propensity score method for binary treatments, and Imbens extended their work to multiple treatments. These authors defined the generalized propensity score as the conditional probability of receiving a particular level of the treatment given the pre-treatment variables. In the present work, we adopted this approach and developed a statistical methodology based on the generalized propensity score in order to estimate treatment effects in the case of multiple treatments. Two methods were discussed and compared: propensity score regression adjustment and propensity score weighting. We used these methods to assess the relative effectiveness of individual treatments in the multiple-treatment IMPACT clinical trial. The results reveal that both methods perform well when the sample size is moderate or large. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The propensity score method is widely used in clinical studies to estimate the effect of a treatment with two levels on patient's outcomes. However, due to the complexity of many diseases, an effective treatment often involves multiple components. For example, in the practice of Traditional Chinese Medicine (TCM), an effective treatment may include multiple components, e.g. Chinese herbs, acupuncture, and massage therapy. In clinical trials involving TCM, patients could be randomly assigned to either the treatment or control group, but they or their doctors may make different choices about which treatment component to use. As a result, treatment components are not randomly assigned. Rosenbaum and Rubin proposed the propensity score method for binary treatments, and Imbens extended their work to multiple treatments. These authors defined the generalized propensity score as the conditional probability of receiving a particular level of the treatment given the pre-treatment variables. In the present work, we adopted this approach and developed a statistical methodology based on the generalized propensity score in order to estimate treatment effects in the case of multiple treatments. Two methods were discussed and compared: propensity score regression adjustment and propensity score weighting. We used these methods to assess the relative effectiveness of individual treatments in the multiple-treatment IMPACT clinical trial. The results reveal that both methods perform well when the sample size is moderate or large. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4003" xmlns="http://purl.org/rss/1.0/"><title>Evaluating traditional Chinese medicine using modern clinical trial design and statistical methodology: Application to a randomized controlled acupuncture trial</title><link>http://dx.doi.org/10.1002%2Fsim.4003</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Evaluating traditional Chinese medicine using modern clinical trial design and statistical methodology: Application to a randomized controlled acupuncture trial</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lixing Lao</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yi Huang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Chiguang Feng</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Brian M. Berman</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ming T. Tan</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-02-23T04:17:48.235229-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4003</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4003</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4003</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>Traditional Chinese medicine (TCM), used in China and other Asian counties for thousands of years, is increasingly utilized in Western countries. However, due to inherent differences in how Western medicine and this ancient modality are practiced, employing the so-called Western medicine-based gold standard research methods to evaluate TCM is challenging. This paper is a discussion of the obstacles inherent in the design and statistical analysis of clinical trials of TCM. It is based on our experience in designing and conducting a randomized controlled clinical trial of acupuncture for post-operative dental pain control in which acupuncture was shown to be statistically and significantly better than placebo in lengthening the median survival time to rescue drug. We demonstrate here that PH assumptions in the common Cox model did not hold in that trial and that TCM trials warrant more thoughtful modeling and more sophisticated models of statistical analysis. TCM study design entails all the challenges encountered in trials of drugs, devices, and surgical procedures in the Western medicine. We present possible solutions to some but leave many issues unresolved. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Traditional Chinese medicine (TCM), used in China and other Asian counties for thousands of years, is increasingly utilized in Western countries. However, due to inherent differences in how Western medicine and this ancient modality are practiced, employing the so-called Western medicine-based gold standard research methods to evaluate TCM is challenging. This paper is a discussion of the obstacles inherent in the design and statistical analysis of clinical trials of TCM. It is based on our experience in designing and conducting a randomized controlled clinical trial of acupuncture for post-operative dental pain control in which acupuncture was shown to be statistically and significantly better than placebo in lengthening the median survival time to rescue drug. We demonstrate here that PH assumptions in the common Cox model did not hold in that trial and that TCM trials warrant more thoughtful modeling and more sophisticated models of statistical analysis. TCM study design entails all the challenges encountered in trials of drugs, devices, and surgical procedures in the Western medicine. We present possible solutions to some but leave many issues unresolved. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4034" xmlns="http://purl.org/rss/1.0/"><title>Issues of design and statistical analysis in controlled clinical acupuncture trials: An analysis of English-language reports from Western journals</title><link>http://dx.doi.org/10.1002%2Fsim.4034</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Issues of design and statistical analysis in controlled clinical acupuncture trials: An analysis of English-language reports from Western journals</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ping Shuai</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xiao-Hua Zhou</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Lixing Lao</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xiaosong Li</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-02-22T03:12:10.466252-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4034</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4034</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4034</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p><b>Objective</b>: To investigate major methods of design and statistical analysis in controlled clinical acupuncture trials published in the West during the past six years (2003–2009) and, based on this analysis, to provide recommendations that address methodological issues and challenges in clinical acupuncture research.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p><b><em>Method</em></b>: PubMed was searched for acupuncture RCTs published in Western journals in English between 2003 and 2009. The keyword used was acupuncture.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p><b>Results</b>: One hundred and eight qualified reports of acupuncture trials that included more than 30 symptoms/conditions were identified, analyzed, and grouped into efficacy (explanatory), effectiveness (pragmatically beneficial), and other (unspecified) studies. All were randomized controlled clinical trials (RCTs). In spite of significant improvement in the quality of acupuncture RCTs in the last 30 years, these reports show that some methodological issues and shortcomings in design and analysis remain. Moreover, the quality of the efficacy studies was not superior to that of the other types of studies. Research design and reporting problems include unclear patient criteria and inadequate practitioner eligibility, inadequate randomization, and blinding, deficiencies in the selection of controls, and improper outcome measurements. The problems in statistical analysis included insufficient sample sizes and power calculations, inadequate handling of missing data and multiple comparisons, and inefficient methods for dealing with repeated measure and cluster data, baseline value adjustment, and confounding issues.</p></div><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p><b>Conclusion</b>: Despite recent advancements in acupuncture research, acupuncture RCTs can be improved, and more rigorous research methods should be carefully considered. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Objective: To investigate major methods of design and statistical analysis in controlled clinical acupuncture trials published in the West during the past six years (2003–2009) and, based on this analysis, to provide recommendations that address methodological issues and challenges in clinical acupuncture research.Method: PubMed was searched for acupuncture RCTs published in Western journals in English between 2003 and 2009. The keyword used was acupuncture.Results: One hundred and eight qualified reports of acupuncture trials that included more than 30 symptoms/conditions were identified, analyzed, and grouped into efficacy (explanatory), effectiveness (pragmatically beneficial), and other (unspecified) studies. All were randomized controlled clinical trials (RCTs). In spite of significant improvement in the quality of acupuncture RCTs in the last 30 years, these reports show that some methodological issues and shortcomings in design and analysis remain. Moreover, the quality of the efficacy studies was not superior to that of the other types of studies. Research design and reporting problems include unclear patient criteria and inadequate practitioner eligibility, inadequate randomization, and blinding, deficiencies in the selection of controls, and improper outcome measurements. The problems in statistical analysis included insufficient sample sizes and power calculations, inadequate handling of missing data and multiple comparisons, and inefficient methods for dealing with repeated measure and cluster data, baseline value adjustment, and confounding issues.Conclusion: Despite recent advancements in acupuncture research, acupuncture RCTs can be improved, and more rigorous research methods should be carefully considered. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.3980" xmlns="http://purl.org/rss/1.0/"><title>Variable selection using the optimal ROC curve: An application to a traditional Chinese medicine study on osteoporosis disease</title><link>http://dx.doi.org/10.1002%2Fsim.3980</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Variable selection using the optimal ROC curve: An application to a traditional Chinese medicine study on osteoporosis disease</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">X. H. Zhou</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">B. Chen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Y. M. Xie</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">F. Tian</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">H. Liu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">X. Liang</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2011-02-03T05:33:45.218982-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.3980</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.3980</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.3980</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Special Issue Paper</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">n/a</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<h3 xhtml="http://www.w3.org/1999/xhtml" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib">Abstract</h3><div class="para" xmlns="http://www.w3.org/1999/xhtml"><p>In biomedical studies, there are multiple sources of information available of which only a small number of them are associated with the diseases. It is of importance to select and combine these factors that are associated with the disease in order to predict the disease status of a new subject. The receiving operating characteristic (ROC) technique has been widely used in disease classification, and the classification accuracy can be measured with area under the ROC curve (AUC). In this article, we combine recent variable selection methods with AUC methods to optimize diagnostic accuracy of multiple risk factors. We first describe one new and some recent AUC-based methods for effectively combining multiple risk factors for disease classification. We then apply them to analyze the data from a new clinical study, investigating whether a combination of traditional Chinese medicine symptoms and standard Western medicine risk factors can increase discriminative accuracy in diagnosing osteoporosis (OP). Based on the results, we conclude that we can make a better diagnosis of primary OP by combining traditional Chinese medicine symptoms with Western medicine risk factors. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In biomedical studies, there are multiple sources of information available of which only a small number of them are associated with the diseases. It is of importance to select and combine these factors that are associated with the disease in order to predict the disease status of a new subject. The receiving operating characteristic (ROC) technique has been widely used in disease classification, and the classification accuracy can be measured with area under the ROC curve (AUC). In this article, we combine recent variable selection methods with AUC methods to optimize diagnostic accuracy of multiple risk factors. We first describe one new and some recent AUC-based methods for effectively combining multiple risk factors for disease classification. We then apply them to analyze the data from a new clinical study, investigating whether a combination of traditional Chinese medicine symptoms and standard Western medicine risk factors can increase discriminative accuracy in diagnosing osteoporosis (OP). Based on the results, we conclude that we can make a better diagnosis of primary OP by combining traditional Chinese medicine symptoms with Western medicine risk factors. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4432" xmlns="http://purl.org/rss/1.0/"><title>Enriched designs for assessing discriminatory performance — analysis of bias and variance</title><link>http://dx.doi.org/10.1002%2Fsim.4432</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Enriched designs for assessing discriminatory performance — analysis of bias and variance</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Paul F. Pinsky</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">B. Gallas</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4432</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4432</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4432</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">501</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">515</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In evaluating discriminatory performance of a new modality in a screening setting, a logistical constraint is that the prevalence of the disease of interest is typically very low. This implies that under a standard study design large numbers of subjects have to be evaluated using the new modality. However, if a predicate modality exists in clinical practice, one can base inclusion into the study of the new modality on the clinical results from the predicate to ‘enrich’ the population of diseased subjects in the study. If this enrichment is not accounted for when estimating sensitivity, specificity, and area under the ROC curve, these ‘naive’ estimates may be substantially biased compared with expected performance in the intended use population. We derive expressions for the magnitude of this bias in terms of correlations of modality scores. When such estimates are ‘corrected’ for the sampling weights using inverse probability weighting, the variances of the estimates of the above quantities are affected. We derive here analytic expressions for these variances. For a fixed number of diseased subjects, differential sampling increases the variance of the (corrected) estimates, all other things being equal. However, differential sampling also increases the number with disease for fixed total study size, which decreases the variance of the sensitivity and area under the ROC curve estimates, all other things being equal. The balance of these two effects determines the gain in efficiency when using enrichment and corrected estimates. These principles are illustrated with a simulation study motivated by the Digital Mammographic Imaging Screening Trial study, a trial of digital versus screen film mammography. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In evaluating discriminatory performance of a new modality in a screening setting, a logistical constraint is that the prevalence of the disease of interest is typically very low. This implies that under a standard study design large numbers of subjects have to be evaluated using the new modality. However, if a predicate modality exists in clinical practice, one can base inclusion into the study of the new modality on the clinical results from the predicate to ‘enrich’ the population of diseased subjects in the study. If this enrichment is not accounted for when estimating sensitivity, specificity, and area under the ROC curve, these ‘naive’ estimates may be substantially biased compared with expected performance in the intended use population. We derive expressions for the magnitude of this bias in terms of correlations of modality scores. When such estimates are ‘corrected’ for the sampling weights using inverse probability weighting, the variances of the estimates of the above quantities are affected. We derive here analytic expressions for these variances. For a fixed number of diseased subjects, differential sampling increases the variance of the (corrected) estimates, all other things being equal. However, differential sampling also increases the number with disease for fixed total study size, which decreases the variance of the sensitivity and area under the ROC curve estimates, all other things being equal. The balance of these two effects determines the gain in efficiency when using enrichment and corrected estimates. These principles are illustrated with a simulation study motivated by the Digital Mammographic Imaging Screening Trial study, a trial of digital versus screen film mammography. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4425" xmlns="http://purl.org/rss/1.0/"><title>An adaptive dose-finding approach for correlated bivariate binary and continuous outcomes in phase I oncology trials</title><link>http://dx.doi.org/10.1002%2Fsim.4425</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">An adaptive dose-finding approach for correlated bivariate binary and continuous outcomes in phase I oncology trials</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Akihiro Hirakawa</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4425</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4425</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4425</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">516</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">532</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>In this study, we developed a novel adaptive dose-finding approach for inclusion of correlated bivariate binary and continuous outcomes in designing phase I oncology trials. For this approach, binary toxicity and continuous efficacy outcomes are modeled jointly with a factorization model. The basic strategy of the proposed approach is based primarily on the Bayesian method. We based the dose escalation/de-escalation decision rules on the posterior distributions of both toxicity and efficacy outcomes. We compared the operating characteristics of the proposed and existing methods through simulation studies under various scenarios. We found that the recommendation rate of the true recommended dose (RD) in the proposed method was more favorable than that in the existing method when the true RD was relatively at the tail end among the tested doses. It was similar to that of the existing method when the true RD was relatively at the top end. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>In this study, we developed a novel adaptive dose-finding approach for inclusion of correlated bivariate binary and continuous outcomes in designing phase I oncology trials. For this approach, binary toxicity and continuous efficacy outcomes are modeled jointly with a factorization model. The basic strategy of the proposed approach is based primarily on the Bayesian method. We based the dose escalation/de-escalation decision rules on the posterior distributions of both toxicity and efficacy outcomes. We compared the operating characteristics of the proposed and existing methods through simulation studies under various scenarios. We found that the recommendation rate of the true recommended dose (RD) in the proposed method was more favorable than that in the existing method when the true RD was relatively at the tail end among the tested doses. It was similar to that of the existing method when the true RD was relatively at the top end. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4423" xmlns="http://purl.org/rss/1.0/"><title>Estimating net transition probabilities from cross-sectional data with application to risk factors in chronic disease modeling</title><link>http://dx.doi.org/10.1002%2Fsim.4423</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Estimating net transition probabilities from cross-sectional data with application to risk factors in chronic disease modeling</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">J. van de Kassteele</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">R.T. Hoogenveen</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">P.M. Engelfriet</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">P.H.M. van Baal</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">H.C. Boshuizen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4423</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4423</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4423</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">533</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">543</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>A problem occurring in chronic disease modeling is the estimation of transition probabilities of moving from one state of a categorical risk factor to another. Transitions could be obtained from a cohort study, but often such data may not be available. However, under the assumption that transitions remain stable over time, age specific cross-sectional prevalence data could be used instead. Problems that then arise are parameter identifiability and the fact that age dependent cross-sectional data are often noisy or are given in age intervals. In this paper we propose a method to estimate so-called net annual transition probabilities from cross-sectional data, including their uncertainties. Net transitions only describe the net inflow or outflow into a certain risk factor state at a certain age. Our approach consists of two steps: first, smooth the data using multinomial P-splines, second, from these data estimate net transition probabilities. This second step can be formulated as a transportation problem, which is solved using the simplex algorithm from linear programming theory. A sensible specification of the cost matrix is crucial to get meaningful results. Uncertainties are assessed by parametric bootstrapping. We illustrate our method using data on body mass index. We conclude that this method provides a flexible way of estimating net transitions and that the use of net transitions has implications for model dynamics, for example when modeling interventions. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>A problem occurring in chronic disease modeling is the estimation of transition probabilities of moving from one state of a categorical risk factor to another. Transitions could be obtained from a cohort study, but often such data may not be available. However, under the assumption that transitions remain stable over time, age specific cross-sectional prevalence data could be used instead. Problems that then arise are parameter identifiability and the fact that age dependent cross-sectional data are often noisy or are given in age intervals. In this paper we propose a method to estimate so-called net annual transition probabilities from cross-sectional data, including their uncertainties. Net transitions only describe the net inflow or outflow into a certain risk factor state at a certain age. Our approach consists of two steps: first, smooth the data using multinomial P-splines, second, from these data estimate net transition probabilities. This second step can be formulated as a transportation problem, which is solved using the simplex algorithm from linear programming theory. A sensible specification of the cost matrix is crucial to get meaningful results. Uncertainties are assessed by parametric bootstrapping. We illustrate our method using data on body mass index. We conclude that this method provides a flexible way of estimating net transitions and that the use of net transitions has implications for model dynamics, for example when modeling interventions. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4420" xmlns="http://purl.org/rss/1.0/"><title>Finite mixture varying coefficient models for analyzing longitudinal heterogenous data</title><link>http://dx.doi.org/10.1002%2Fsim.4420</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Finite mixture varying coefficient models for analyzing longitudinal heterogenous data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Zhaohua Lu</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Xinyuan Song</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4420</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4420</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4420</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">544</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">560</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>This paper aims to develop a mixture model to study heterogeneous longitudinal data on the treatment effect of heroin use from a California Civil Addict Program. Each component of the mixture is characterized by a varying coefficient mixed effect model. We use the Bayesian P-splines approach to approximate the varying coefficient functions. We develop Markov chain Monte Carlo algorithms to estimate the smooth functions, unknown parameters, and latent variables in the model. We use modified deviance information criterion to determine the number of components in the mixture. A simulation study demonstrates that the modified deviance information criterion selects the correct number of components and the estimation of unknown quantities is accurate. We apply the proposed model to the heroin treatment study. Furthermore, we identify heterogeneous longitudinal patterns. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>This paper aims to develop a mixture model to study heterogeneous longitudinal data on the treatment effect of heroin use from a California Civil Addict Program. Each component of the mixture is characterized by a varying coefficient mixed effect model. We use the Bayesian P-splines approach to approximate the varying coefficient functions. We develop Markov chain Monte Carlo algorithms to estimate the smooth functions, unknown parameters, and latent variables in the model. We use modified deviance information criterion to determine the number of components in the mixture. A simulation study demonstrates that the modified deviance information criterion selects the correct number of components and the estimation of unknown quantities is accurate. We apply the proposed model to the heroin treatment study. Furthermore, we identify heterogeneous longitudinal patterns. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4450" xmlns="http://purl.org/rss/1.0/"><title>Restricted mean models for transplant benefit and urgency</title><link>http://dx.doi.org/10.1002%2Fsim.4450</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Restricted mean models for transplant benefit and urgency</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Fang Xiang</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Susan Murray</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4450</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4450</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4450</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">561</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">576</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The US lung allocation policy estimates each individual's urgency and transplant benefit in defining a lung allocation score (LAS). Transplant benefit, as defined by the Organ Procurement and Transplantation Network Thoracic Committee, is the days of life gained over the following year if transplanted versus not transplanted. Urgency is measured by days of life during the next year without transplant. In both definitions, accurate estimation of wait list days lived, or a wait list restricted mean lifetime, is required. Risk factors are available to estimate patient urgency when listed, with more urgent patients removed from the wait list upon death or transplant. As a patient progresses, priority for transplant (censoring) changes accordingly. Therefore, it is crucial to adjust for dependent censoring in modeling days of life. We develop a model for the restricted mean as a function of covariates, by using pseudo-observations that account for dependent censoring linked to a series of longitudinal measures (LAS). Simulation results show that our method performs well in situations comparable with the LAS setting. Applying wait list and post-transplant model results that account for dependent censoring to wait list patients, we obtain estimates of transplant benefit that are larger for many of the more urgent patients in need of transplant. The difference in LAS for an individual, when properly accounting for dependent censoring, has high impact on the priority and timing of an organ offer for these patients. Copyright © 2012 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The US lung allocation policy estimates each individual's urgency and transplant benefit in defining a lung allocation score (LAS). Transplant benefit, as defined by the Organ Procurement and Transplantation Network Thoracic Committee, is the days of life gained over the following year if transplanted versus not transplanted. Urgency is measured by days of life during the next year without transplant. In both definitions, accurate estimation of wait list days lived, or a wait list restricted mean lifetime, is required. Risk factors are available to estimate patient urgency when listed, with more urgent patients removed from the wait list upon death or transplant. As a patient progresses, priority for transplant (censoring) changes accordingly. Therefore, it is crucial to adjust for dependent censoring in modeling days of life. We develop a model for the restricted mean as a function of covariates, by using pseudo-observations that account for dependent censoring linked to a series of longitudinal measures (LAS). Simulation results show that our method performs well in situations comparable with the LAS setting. Applying wait list and post-transplant model results that account for dependent censoring to wait list patients, we obtain estimates of transplant benefit that are larger for many of the more urgent patients in need of transplant. The difference in LAS for an individual, when properly accounting for dependent censoring, has high impact on the priority and timing of an organ offer for these patients. Copyright © 2012 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4438" xmlns="http://purl.org/rss/1.0/"><title>Program impact evaluation using a matching method with panel data</title><link>http://dx.doi.org/10.1002%2Fsim.4438</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Program impact evaluation using a matching method with panel data</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Viet Cuong Nguyen</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4438</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4438</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4438</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">577</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">588</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>Difference-in-differences with matching is a popular method to measure the impact of an intervention in health and social sciences. This method requires baseline data, that is, data before interventions, which are not always available in reality. Instead, panel data with two time periods are often collected after interventions begin. In this paper, a simple matching method is proposed to measure the impact of an intervention using two-period panel data after the intervention. The method is illustrated by the measurement of the effect of health insurance in Vietnam using household panel data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>Difference-in-differences with matching is a popular method to measure the impact of an intervention in health and social sciences. This method requires baseline data, that is, data before interventions, which are not always available in reality. Instead, panel data with two time periods are often collected after interventions begin. In this paper, a simple matching method is proposed to measure the impact of an intervention using two-period panel data after the intervention. The method is illustrated by the measurement of the effect of health insurance in Vietnam using household panel data. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4456" xmlns="http://purl.org/rss/1.0/"><title>An autoregressive linear mixed effects model for the analysis of unequally spaced longitudinal data with dose-modification</title><link>http://dx.doi.org/10.1002%2Fsim.4456</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">An autoregressive linear mixed effects model for the analysis of unequally spaced longitudinal data with dose-modification</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Ikuko Funatogawa</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Takashi Funatogawa</dc:creator><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4456</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4456</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4456</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Research Article</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">589</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">599</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div class="para" xmlns:ol="http://www.wiley.com/namespaces/ol/xsl-lib" xmlns="http://www.w3.org/1999/xhtml"><p>The assessment of the dose–response relationship is important but not straightforward when the therapeutic agent is administered repeatedly with dose-modification in each patient and a continuous response is measured repeatedly. We recently proposed an autoregressive linear mixed effects model for such data in which the current response is regressed on the previous response, fixed effects, and random effects. The model represents profiles approaching each patient's asymptote, takes into account the past dose history, and provides a dose–response relationship of the asymptote as a summary measure. In an autoregressive model, intermittent missing data mean the missing values in previous responses as covariates. We previously provided the marginal (unconditional on the previous response) form of the proposed model to deal with intermittent missing data. Irregular timings of dose-modification or measurement can also be treated as equally spaced data with intermittent missing values by selecting an adequately small unit of time. The likelihood is, however, expressed by matrices whose sizes depend on the number of observations for a patient, and the computational burden is large. In this study, we propose a state space form of the autoregressive linear mixed effects model to calculate the marginal likelihood without using large matrices. The regression coefficients of the fixed effects can be concentrated out of the likelihood in this model by the same way of a linear mixed effects model. As an illustration of the approach, we analyzed immunologic data from a clinical trial for multiple sclerosis patients and estimated the dose–response curves for each patient and the population mean. Copyright © 2011 John Wiley &amp; Sons, Ltd.</p></div>]]></content:encoded><description>The assessment of the dose–response relationship is important but not straightforward when the therapeutic agent is administered repeatedly with dose-modification in each patient and a continuous response is measured repeatedly. We recently proposed an autoregressive linear mixed effects model for such data in which the current response is regressed on the previous response, fixed effects, and random effects. The model represents profiles approaching each patient's asymptote, takes into account the past dose history, and provides a dose–response relationship of the asymptote as a summary measure. In an autoregressive model, intermittent missing data mean the missing values in previous responses as covariates. We previously provided the marginal (unconditional on the previous response) form of the proposed model to deal with intermittent missing data. Irregular timings of dose-modification or measurement can also be treated as equally spaced data with intermittent missing values by selecting an adequately small unit of time. The likelihood is, however, expressed by matrices whose sizes depend on the number of observations for a patient, and the computational burden is large. In this study, we propose a state space form of the autoregressive linear mixed effects model to calculate the marginal likelihood without using large matrices. The regression coefficients of the fixed effects can be concentrated out of the likelihood in this model by the same way of a linear mixed effects model. As an illustration of the approach, we analyzed immunologic data from a clinical trial for multiple sclerosis patients and estimated the dose–response curves for each patient and the population mean. Copyright © 2011 John Wiley &amp; Sons, Ltd.</description></item><item rdf:about="http://dx.doi.org/10.1002%2Fsim.4436" xmlns="http://purl.org/rss/1.0/"><title>Correction: Evaluation metrics for biostatistical and epidemiological collaborations</title><link>http://dx.doi.org/10.1002%2Fsim.4436</link><dc:title xmlns:dc="http://purl.org/dc/elements/1.1/">Correction: Evaluation metrics for biostatistical and epidemiological collaborations</dc:title><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Doris McGartland Rubio</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Deborah J. del Junco</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Rafia Bhore</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Christopher J. Lindsell</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Robert A. Oster</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Knut M. Wittkowski</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Leah J. Welty</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">Yi-Ju Li</dc:creator><dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2012-03-15T00:00:00-05:00</dc:date><dc:identifier xmlns:dc="http://purl.org/dc/elements/1.1/">doi:10.1002/sim.4436</dc:identifier><dc:rights xmlns:dc="http://purl.org/dc/elements/1.1/"/><dc:publisher xmlns:dc="http://purl.org/dc/elements/1.1/">John Wiley &amp; Sons, Inc.</dc:publisher><prism:doi xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">10.1002/sim.4436</prism:doi><prism:url xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">http://dx.doi.org/10.1002%2Fsim.4436</prism:url><prism:section xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">Erratum</prism:section><prism:startingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">600</prism:startingPage><prism:endingPage xmlns:prism="http://prismstandard.org/namespaces/1.2/basic/">600</prism:endingPage><content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[]]></content:encoded><description/></item></rdf:RDF>
