##
## RNG tests using DKW inequality for rate of convergence
##
## P(sup | F_n - F | > t) < 2 exp(-2nt^2)
##
## The 2 in front of exp() was derived by Massart. It is the best possible
## constant valid uniformly in t,n,F. For large n*t^2 this agrees with the
## large-sample approximation to the Kolmogorov-Smirnov statistic.
##

## When tryCatch()ing all seeds in 0:10000, the following 346 failed (Lnx 64b, R 3.5.0):
suppressWarnings(RNGversion("3.5.0"))
failingSeeds <- c(
      16,   42,   51,   63,   79,
     108,  143,  171,  208,  215,
     230,  236,  254,  323,  327,
     332,  333,  374,  386,  387,
     438,  440,  450,  472,  547,
     609,  673,  740,  784,  787,
     792,  806,  846,  897,  938,
    1017, 1043, 1062, 1067, 1076,
    1090, 1113, 1115, 1136, 1142,
    1148, 1162, 1193, 1249, 1259,
    1299, 1338, 1347, 1366, 1407,
    1428, 1457, 1461, 1540, 1609,
    1613, 1622, 1629, 1664, 1712,
    1760, 1779, 1786, 1826, 1852,
    1868, 1871, 1880, 1928, 1930,
    1978, 1984, 2025, 2073, 2081,
    2082, 2130, 2148, 2153, 2172,
    2175, 2228, 2298, 2353, 2368,
    2430, 2444, 2462, 2493, 2528,
    2631, 2750, 2752, 2765, 2774,
    2794, 2817, 2873, 2888, 2905,
    2906, 2911, 2936, 2955, 2989,
    3029, 3048, 3053, 3084, 3100,
    3148, 3183, 3192, 3232, 3256,
    3266, 3302, 3311, 3313, 3319,
    3325, 3340, 3344, 3375, 3477,
    3506, 3516, 3518, 3521, 3553,
    3601, 3655, 3717, 3733, 3810,
    3814, 3962, 4043, 4095, 4119,
    4174, 4185, 4192, 4228, 4240,
    4261, 4298, 4335, 4338, 4349,
    4402, 4433, 4461, 4491, 4496,
    4508, 4511, 4530, 4604, 4622,
    4640, 4669, 4677, 4682, 4683,
    4705, 4717, 4725, 4757, 4816,
    4899, 4931, 5014, 5022, 5063,
    5082, 5105, 5107, 5137, 5155,
    5160, 5165, 5169, 5182, 5186,
    5197, 5207, 5210, 5211, 5263,
    5281, 5282, 5288, 5364, 5529,
    5568, 5611, 5651, 5700, 5740,
    5796, 5869, 5874, 5878, 5920,
    5954, 5972, 6034, 6037, 6073,
    6086, 6118, 6120, 6126, 6234,
    6235, 6263, 6287, 6301, 6360,
    6364, 6377, 6416, 6491, 6493,
    6524, 6534, 6568, 6615, 6679,
    6682, 6777, 6782, 6790, 6808,
    6885, 6887, 6936, 6938, 6961,
    7011, 7046, 7047, 7062, 7111,
    7181, 7202, 7206, 7207, 7227,
    7261, 7301, 7311, 7313, 7324,
    7364, 7385, 7394, 7412, 7486,
    7504, 7519, 7536, 7584, 7665,
    7692, 7762, 7787, 7797, 7865,
    7916, 7959, 7967, 8038, 8047,
    8048, 8086, 8123, 8125, 8160,
    8213, 8243, 8254, 8255, 8307,
    8335, 8403, 8453, 8487, 8541,
    8549, 8577, 8587, 8638, 8640,
    8651, 8664, 8703, 8770, 8781,
    8793, 8841, 8888, 8900, 8962,
    8963, 8965, 9028, 9052, 9054,
    9061, 9143, 9198, 9204, 9232,
    9238, 9247, 9308, 9311, 9321,
    9342, 9360, 9430, 9457, 9564,
    9572, 9609, 9657, 9738, 9743,
    9750, 9758, 9779, 9789, 9848,
    9881, 9895, 9903, 9905, 9947,
    9982)
## randomly setting one of the valid 10001-346 = 9655 seeds:
iseed <- sample(setdiff(0:10000, failingSeeds), size = 1)
dump("iseed", file = "p-r-random-tests_seed") #(for reproducibility, not into *.Rout)
set.seed(iseed)

## Supremum error between an empirical and a theoretical CDF.
##
## Draws `sample.size` variates with `rfoo(sample.size, ...)`, evaluates
## `pfoo(., ...)` at the distinct sampled values, and returns the largest
## absolute difference between the empirical CDF (cumulative relative
## frequencies at those values) and `pfoo`.
##
## rfoo        : random generator, called as rfoo(sample.size, ...)
## pfoo        : distribution function, called as pfoo(xi, ...)
## sample.size : number of variates to draw
## ...         : distribution parameters, passed to both rfoo and pfoo
superror <- function(rfoo, pfoo, sample.size, ...) {
    x <- rfoo(sample.size, ...)
    tx <- table(signif(x, 12)) # such that xi will be sort(unique(x))
    xi <- as.numeric(names(tx))
    f <- pfoo(xi, ...)
    fhat <- cumsum(tx) / sample.size
    max(abs(fhat - f))
}

## DKW upper bound 2 exp(-2 n t^2) on P(sup |F_n - F| > t).
pdkwbound <- function(n, t) 2 * exp(-2 * n * t * t)

## Inverse of pdkwbound() in t: the deviation t at which the bound equals p.
qdkwbound <- function(n, p) sqrt(log(p / 2) / (-2 * n))

## Test the generator r<stub> against the distribution function p<stub>.
##
## stub            : distribution name; "r" and "p" are prepended to find the
##                   generator and the distribution function
## ...             : distribution parameters, passed to both functions
## sample.size     : number of variates drawn
## pthreshold      : the test passes when the supremum error is below
##                   qdkwbound(sample.size, pthreshold)
## print.result    : print the call followed by " PASSED" / " FAILED"?
## print.detail    : additionally print the supremum error and the DKW bound?
## stop.on.failure : signal an error ("dkwtest failed") when the test fails?
##
## Returns TRUE when the test passed and FALSE otherwise.
dkwtest <- function(stub = "norm", ...,
                    sample.size = 10000, pthreshold = 0.001,
                    print.result = TRUE, print.detail = FALSE,
                    stop.on.failure = TRUE)
{
    ## mode = "function" skips any non-function object that happens to
    ## share the name (e.g. a variable called `rt` or `pf`).
    rfoo <- get(paste0("r", stub), mode = "function")
    pfoo <- get(paste0("p", stub), mode = "function")
    s <- superror(rfoo, pfoo, sample.size, ...)
    if (print.result || print.detail) {
        ## Rebuild the call as  <stub>(<args>)  for the log line.
        printargs <- substitute(list(...))
        printargs[[1]] <- as.name(stub)
        cat(deparse(printargs))
        if (print.detail)
            cat("\nsupremum error = ", signif(s, 2),
                " with p-value=",
                min(1, round(pdkwbound(sample.size, s), 4)), "\n")
    }
    ## isTRUE(): a supremum error that could not be computed (NA/NaN) counts
    ## as a failure instead of propagating NA into the indexing and the
    ## `if` below.
    rval <- isTRUE(s < qdkwbound(sample.size, pthreshold))
    if (print.result)
        cat(if (rval) " PASSED\n" else " FAILED\n")
    if (stop.on.failure && !rval)
        stop("dkwtest failed")
    rval
}

.proctime00 <- proc.time() # start timing

## NB: the order of the calls below matters -- they all consume the same
## RNG stream, and the failing-seed list above was recorded for this order.

dkwtest("binom", size =   1, prob = 0.2)
dkwtest("binom", size =   2, prob = 0.2)
dkwtest("binom", size = 100, prob = 0.2)
dkwtest("binom", size = 1e4, prob = 0.2)
dkwtest("binom", size =   1, prob = 0.8)
dkwtest("binom", size = 100, prob = 0.8)
dkwtest("binom", size = 100, prob = 0.999)

dkwtest("pois", lambda = 0.095)
dkwtest("pois", lambda = 0.95)
dkwtest("pois", lambda = 9.5)
dkwtest("pois", lambda = 95)

dkwtest("nbinom", size =   1, prob = 0.2)
dkwtest("nbinom", size =   2, prob = 0.2)
dkwtest("nbinom", size = 100, prob = 0.2)
dkwtest("nbinom", size = 1e4, prob = 0.2)
dkwtest("nbinom", size =   1, prob = 0.8)
dkwtest("nbinom", size = 100, prob = 0.8)
dkwtest("nbinom", size = 100, prob = 0.999)

dkwtest("norm")
dkwtest("norm", mean = 5, sd = 3)

dkwtest("gamma", shape = 0.1)
dkwtest("gamma", shape = 0.2)
dkwtest("gamma", shape = 10)
dkwtest("gamma", shape = 20)

dkwtest("hyper", m = 40, n = 30, k = 20)
dkwtest("hyper", m = 40, n = 3, k = 20)
dkwtest("hyper", m = 6, n = 3, k = 2)
dkwtest("hyper", m = 5, n = 3, k = 2)
dkwtest("hyper", m = 4, n = 3, k = 2)

dkwtest("signrank", n = 1)
dkwtest("signrank", n = 2)
dkwtest("signrank", n = 10)
dkwtest("signrank", n = 30)

dkwtest("wilcox", m = 40, n = 30)
dkwtest("wilcox", m = 40, n = 10)
dkwtest("wilcox", m = 6, n = 3)
dkwtest("wilcox", m = 5, n = 3)
dkwtest("wilcox", m = 4, n = 3)

dkwtest("chisq", df = 1)
dkwtest("chisq", df = 10)

dkwtest("logis")
dkwtest("logis", location = 4, scale = 2)

dkwtest("t", df = 1)
dkwtest("t", df = 10)
dkwtest("t", df = 40)

dkwtest("beta", shape1 = 1, shape2 = 1)
dkwtest("beta", shape1 = 2, shape2 = 1)
dkwtest("beta", shape1 = 1, shape2 = 2)
dkwtest("beta", shape1 = 2, shape2 = 2)
dkwtest("beta", shape1 = .2, shape2 = .2)

dkwtest("cauchy")
dkwtest("cauchy", location = 4, scale = 2)

dkwtest("f", df1 = 1, df2 = 1)
dkwtest("f", df1 = 1, df2 = 10)
dkwtest("f", df1 = 10, df2 = 10)
dkwtest("f", df1 = 30, df2 = 3)

dkwtest("weibull", shape = 1)
dkwtest("weibull", shape = 4, scale = 4)

## regression test for PR#7314
dkwtest("hyper", m=60, n=100, k=50)
dkwtest("hyper", m=6, n=10, k=5)
dkwtest("hyper", m=600, n=1000, k=500)

## regression test for non-central t bug
dkwtest("t", df=20, ncp=3)
## regression test for non-central F bug
dkwtest("f", df1=10, df2=2, ncp=3)

cat('Time elapsed: ', proc.time() - .proctime00,'\n')