@techreport{873c7c3cf0b4476ebf57493411313768,
title = "Safe Testing",
abstract = "We develop the theory of hypothesis testing based on the e-value, a notion of evidence that, unlike the p-value, allows for effortlessly combining results from several studies in the common scenario where the decision to perform a new study may depend on previous outcomes. Tests based on e-values are safe, i.e. they preserve Type-I error guarantees, under such optional continuation. We define growth-rate optimality (GRO) as an analogue of power in an optional continuation context, and we show how to construct GRO e-variables for general testing problems with composite null and alternative, emphasizing models with nuisance parameters. GRO e-values take the form of Bayes factors with special priors. We illustrate the theory using several classic examples including a one-sample safe t-test and the 2 x 2 contingency table. Sharing Fisherian, Neymanian and Jeffreys-Bayesian interpretations, e-values may provide a methodology acceptable to adherents of all three schools. ",
keywords = "math.ST, cs.IT, cs.LG, math.IT, stat.ME, stat.TH",
author = "Peter Gr{\"u}nwald and {de Heide}, Rianne and Koolen, {Wouter M.}",
note = "Accepted as discussion paper to the Journal of the Royal Statistical Society series B",
year = "2019",
month = jun,
day = "18",
doi = "10.48550/arXiv.1906.07801",
language = "English",
publisher = "ArXiv.org",
type = "WorkingPaper",
institution = "ArXiv.org",
}