% Canadian Journal of Statistics articles; citation keys are "MTMT:" followed by
% the record's unique-id, and each url points at the m2.mtmt.hu publication API.
% Fields such as journal-iso, unique-id, eissn, orcid-numbers and internal-note
% are not standard BibTeX fields; standard styles ignore them.

@article{MTMT:35309767,
  author        = {Frydman, Halina and Surya, Budhi Arta},
  title         = {Estimation in a general mixture of {Markov} jump processes},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2024},
  doi           = {10.1002/cjs.11814},
  url           = {https://m2.mtmt.hu/api/publication/35309767},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {35309767},
  keywords      = {HETEROGENEITY; Fisher information matrix; EM algorithm; mixture of Markov jump processes},
}

@article{MTMT:35269990,
  author        = {Zhuang, Weiwei and Wang, Peiming and Chen, Jiahua},
  title         = {Tests for the first-order stochastic dominance},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2024},
  doi           = {10.1002/cjs.11811},
  url           = {https://m2.mtmt.hu/api/publication/35269990},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {35269990},
  keywords      = {Brownian bridge; Bootstrap; empirical process; Stochastic dominance; Asymptotic test; frontal configurations},
  orcid-numbers = {Chen, Jiahua/0000-0001-8064-4444},
}

@article{MTMT:34886789,
  author        = {Zhao, Y. and Sun, L.},
  title         = {A stable and adaptive polygenic signal detection method based on repeated sample splitting},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  volume        = {52},
  pages         = {79--97},
  year          = {2024},
  doi           = {10.1002/cjs.11768},
  url           = {https://m2.mtmt.hu/api/publication/34886789},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {34886789},
}

@article{MTMT:34314200,
  author        = {Roberts, Gareth O. and Rosenthal, Jeffrey S.},
  title         = {Football group draw probabilities and corrections},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2023},
  doi           = {10.1002/cjs.11798},
  url           = {https://m2.mtmt.hu/api/publication/34314200},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {34314200},
  abstract      = {This article considers the challenge of designing football group draw mechanisms, which have a uniform distribution over all valid draw assignments, but are also entertaining, practical and transparent. Although this problem is trivial in completely symmetric problems, it becomes challenging when there are draw constraints that are not exchangeable across each of the competing teams, so that symmetry breaks down. We explain how to simulate the FIFA sequential draw method and compute the nonuniformity of its draws by comparison with a uniform rejection sampler. We then propose several practical methods of achieving the uniform distribution while still using balls and bowls in a way which is suitable for a televised draw. The solutions can also be carried out interactively. The general methodology we provide can readily be transported to different competition draws and is not restricted to football events.},
  orcid-numbers = {Rosenthal, Jeffrey S./0000-0002-5118-6808},
}

@article{MTMT:33244338,
  author        = {Jiang, Cong and Wallace, Michael P. and Thompson, Mary E.},
  title         = {Dynamic treatment regimes with interference},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2022},
  doi           = {10.1002/cjs.11702},
  url           = {https://m2.mtmt.hu/api/publication/33244338},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33244338},
  keywords      = {INTERFERENCE; dynamic treatment regimes; Double robustness; dynamic weighted ordinary least squares; population assessment of tobacco and health},
  abstract      = {Precision medicine describes health care where patient-level data are used to inform treatment decisions. Within this framework, dynamic treatment regimes (DTRs) are sequences of decision rules that take individual patient information as input data and then output treatment recommendations. DTR estimation from observational data typically relies on the assumption of no interference: i.e., the outcome of one individual is unaffected by the treatment assignment of others. However, in many social network contexts, such as friendship or family networks, and for many health concerns, such as infectious diseases, this assumption is questionable. We investigate the DTR estimation method of dynamic weighted ordinary least squares (dWOLS), which boasts of easy implementation and the so-called double-robustness property, but relies on the assumption of no interference. We define a network propensity function and build on it to establish an implementation of dWOLS that remains doubly robust under interference associated with network links. The method's properties are demonstrated via simulation and applied to data from the Population Assessment of Tobacco and Health (PATH) study to investigate cigarette dependence within two-person household networks.},
}

@article{MTMT:33244076,
  author        = {Fan, Yifan and Jiang, Binyan and Yan, Ting and Zhang, Yuan},
  title         = {Asymptotic theory in bipartite graph models with a growing number of parameters},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2022},
  doi           = {10.1002/cjs.11735},
  url           = {https://m2.mtmt.hu/api/publication/33244076},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33244076},
  keywords      = {Bipartite graphs; Asymptotic properties; Moment estimation; Node degrees},
  abstract      = {Affiliation networks contain a set of actors and a set of events, where edges denote the affiliation relationships between actors and events. Here, we introduce a class of affiliation network models for modelling the degree heterogeneity, where two sets of degree parameters are used to measure the activeness of actors and the popularity of events, respectively. We develop the moment method to infer these degree parameters. We establish a unified theoretical framework in which the consistency and asymptotic normality of the moment estimator hold as the numbers of actors and events both go to infinity. We apply our results to several popular models with weighted edges, including generalized beta-, Poisson and Rayleigh models. Simulation studies and a realistic example that involves the Poisson model provide concrete evidence that supports our theoretical findings.},
}

@article{MTMT:33158499,
  author        = {Cs{\"o}rg{\H{o}}, Mikl{\'o}s and Dawson, Donald A. and Nasri, Bouchra R. and Remillard, Bruno N.},
  title         = {A random walk through {Canadian} contributions on empirical processes and their applications in probability and statistics},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  year          = {2022},
  doi           = {10.1002/cjs.11730},
  url           = {https://m2.mtmt.hu/api/publication/33158499},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33158499},
  keywords      = {Time series; Copulas; empirical process; strong approximation; Change point; Goodness-of-fit; Measure-valued process; Generalized error models; McKean-Vlasov; Fleming-Viot; super Brownian motion},
  abstract      = {In this article, we present a review of important results and statistical applications obtained or generalized by Canadian pioneers and their collaborators, for empirical processes of independent and identically distributed observations, pseudo-observations, and time series. In particular, we consider weak convergence and strong approximations results, as well as tests for model adequacy such as tests of independence, tests of goodness-of-fit, tests of change point, and tests of serial dependence for time series. We also consider applications of empirical processes of interacting particle systems for the approximation of measure-valued processes.},
}

@article{MTMT:33389460,
  author        = {Ge, Xinyi and Peng, Yingwei and Tu, Dongsheng},
  title         = {A generalized single-index linear threshold model for identifying treatment-sensitive subsets based on multiple covariates and longitudinal measurements},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  volume        = {51},
  pages         = {1171--1189},
  year          = {2022},
  doi           = {10.1002/cjs.11737},
  url           = {https://m2.mtmt.hu/api/publication/33389460},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33389460},
  keywords      = {Clinical studies; longitudinal data; Predictive markers; Generalized linear model; Repeated measurements; combination of covariates},
  abstract      = {Identification of a subset of patients who may be sensitive to a specific treatment is an important step towards personalized medicine. We consider the case where the effect of a treatment is assessed by longitudinal measurements, which may be continuous or categorical, such as quality of life scores assessed over the duration of a clinical trial. We assume that multiple baseline covariates, such as age and expression levels of genes, are available, and propose a generalized single-index linear threshold model to identify the treatment-sensitive subset and assess the treatment-by-subset interaction after combining these covariates. Because the model involves an indicator function with unknown parameters, conventional procedures are difficult to apply for inferences of the parameters in the model. We define smoothed generalized estimating equations and propose an inference procedure based on these equations with an efficient spectral algorithm to find their solutions. The proposed procedure is evaluated through simulation studies and an application to the analysis of data from a randomized clinical trial in advanced pancreatic cancer.},
  orcid-numbers = {Tu, Dongsheng/0000-0003-4842-2184},
  internal-note = {NOTE(review): volume 51 is paired with year 2022, while the other 2022 entries in this file carry volume 50 -- confirm the year against the publisher record},
}

@article{MTMT:33317621,
  author        = {Susko, E.},
  title         = {Complex statistical modelling for phylogenetic inference},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  volume        = {50},
  pages         = {1339--1354},
  year          = {2022},
  doi           = {10.1002/cjs.11741},
  url           = {https://m2.mtmt.hu/api/publication/33317621},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33317621},
}

@article{MTMT:33177590,
  author        = {Douwes-Schultz, Dirk and Sun, Shuo and Schmidt, Alexandra M. and Moodie, Erica E. M.},
  title         = {Extended {Bayesian} endemic-epidemic models to incorporate mobility data into {COVID-19} forecasting},
  journal       = {CANADIAN JOURNAL OF STATISTICS / REVUE CANADIENNE DE STATISTIQUE},
  journal-iso   = {CAN J STAT},
  volume        = {50},
  pages         = {713--733},
  year          = {2022},
  doi           = {10.1002/cjs.11723},
  url           = {https://m2.mtmt.hu/api/publication/33177590},
  issn          = {0319-5724},
  eissn         = {1708-945X},
  unique-id     = {33177590},
  keywords      = {Time series; autoregressive model; Bayesian prediction; distributed-lag model},
  abstract      = {Forecasting the number of daily COVID-19 cases is critical in the short-term planning of hospital and other public resources. One potentially important piece of information for forecasting COVID-19 cases is mobile device location data that measure the amount of time an individual spends at home. Endemic-epidemic (EE) time series models are recently proposed autoregressive models where the current mean case count is modelled as a weighted average of past case counts multiplied by an autoregressive rate, plus an endemic component. We extend EE models to include a distributed-lag model in order to investigate the association between mobility and the number of reported COVID-19 cases; we additionally include a weekly first-order random walk to capture additional temporal variation. Further, we introduce a shifted negative binomial weighting scheme for the past counts that is more flexible than previously proposed weighting schemes. We perform inference under a Bayesian framework to incorporate parameter uncertainty into model forecasts. We illustrate our methods using data from four US counties.},
  orcid-numbers = {Sun, Shuo/0000-0002-4170-9388},
}