349 lines
15 KiB
Plaintext
Raw Permalink Normal View History

2025-01-12 00:52:51 +08:00
R Under development (unstable) (2019-05-15 r76504) -- "Unsuffered Consequences"
Copyright (C) 2019 The R Foundation for Statistical Computing
Platform: x86_64-pc-linux-gnu (64-bit)
R is free software and comes with ABSOLUTELY NO WARRANTY.
You are welcome to redistribute it under certain conditions.
Type 'license()' or 'licence()' for distribution details.
R is a collaborative project with many contributors.
Type 'contributors()' for more information and
'citation()' on how to cite R or R packages in publications.
Type 'demo()' for some demos, 'help()' for on-line help, or
'help.start()' for an HTML browser interface to help.
Type 'q()' to quit R.
> options(na.action=na.exclude) # preserve missings
> options(contrasts=c('contr.treatment', 'contr.poly')) #ensure constrast type
> library(survival)
>
> aeq <- function(x,y, ...) all.equal(as.vector(x), as.vector(y), ...)
>
> fit1 <- survreg(Surv(futime, fustat) ~ age + ecog.ps, ovarian)
> fit4 <- survreg(Surv(log(futime), fustat) ~age + ecog.ps, ovarian,
+ dist='extreme')
>
> print(fit1)
Call:
survreg(formula = Surv(futime, fustat) ~ age + ecog.ps, data = ovarian)
Coefficients:
(Intercept) age ecog.ps
12.28496723 -0.09702669 0.09977342
Scale= 0.6032744
Loglik(model)= -90 Loglik(intercept only)= -98
Chisq= 15.98 on 2 degrees of freedom, p= 0.000339
n= 26
> summary(fit4)
Call:
survreg(formula = Surv(log(futime), fustat) ~ age + ecog.ps,
data = ovarian, dist = "extreme")
Value Std. Error z p
(Intercept) 12.2850 1.5015 8.18 2.8e-16
age -0.0970 0.0235 -4.13 3.7e-05
ecog.ps 0.0998 0.3657 0.27 0.785
Log(scale) -0.5054 0.2351 -2.15 0.032
Scale= 0.603
Extreme value distribution
Loglik(model)= -21.8 Loglik(intercept only)= -29.8
Chisq= 15.98 on 2 degrees of freedom, p= 0.00034
Number of Newton-Raphson Iterations: 5
n= 26
>
>
> # Hypothesis (and I'm fairly sure): censorReg shares the fault of many
> # iterative codes -- it returns the loglik and variance for iteration k
> # but the coef vector of iteration k+1. Hence the "all.equal" tests
> # below don't come out perfect.
> #
> if (exists('censorReg')) { #true for Splus, not R
+ fit2 <- censorReg(censor(futime, fustat) ~ age + ecog.ps, ovarian)
+ fit3 <- survreg(Surv(futime, fustat) ~ age + ecog.ps, ovarian,
+ iter=0, init=c(fit2$coef, log(fit2$scale)))
+
+ aeq(resid(fit2, type='working')[,1], resid(fit3, type='working'))
+ aeq(resid(fit2, type='response')[,1], resid(fit3, type='response'))
+
+ temp <- sign(resid(fit3, type='working'))
+ aeq(resid(fit2, type='deviance')[,1],
+ temp*abs(resid(fit3, type='deviance')))
+ aeq(resid(fit2, type='deviance')[,1], resid(fit3, type='deviance'))
+ }
> #
> # Now check fit1 and fit4, which should follow identical iteration paths
> # These tests should all be true
> #
> aeq(fit1$coef, fit4$coef)
[1] TRUE
>
> resid(fit1, type='working')
1 2 3 4 5 6
-4.5081778 -0.5909810 -2.4878519 0.6032744 -5.8993431 0.6032744
7 8 9 10 11 12
-1.7462937 -0.8102883 0.6032744 -1.6593962 -0.8235265 0.6032744
13 14 15 16 17 18
0.6032744 0.6032744 0.6032744 0.6032744 0.6032744 0.6032744
19 20 21 22 23 24
0.6032744 0.6032744 0.6032744 0.2572623 -31.8006867 -0.7426277
25 26
-0.2857597 0.6032744
> resid(fit1, type='response')
1 2 3 4 5 6
-155.14523 -58.62744 -262.03173 -927.79842 -1377.84908 -658.86626
7 8 9 10 11 12
-589.74449 -318.93436 4.50671 -686.83338 -434.39281 -1105.68733
13 14 15 16 17 18
-42.43371 -173.09223 -4491.29974 -3170.49394 -5028.31053 -2050.91373
19 20 21 22 23 24
-150.65033 -2074.09345 412.32400 76.35826 -3309.40331 -219.81579
25 26
-96.19691 -457.76731
> resid(fit1, type='deviance')
1 2 3 4 5 6 7
-1.5842290 -0.6132746 -1.2876971 0.5387840 -1.7148539 0.6682580 -1.1102921
8 9 10 11 12 13 14
-0.7460191 1.4253843 -1.0849419 -0.7531720 0.6648130 1.3526380 1.1954382
15 16 17 18 19 20 21
0.2962391 0.3916044 0.3278067 0.5929057 1.2747643 0.6171130 1.9857606
22 23 24 25 26
0.6125492 -2.4504208 -0.7080652 -0.3642424 0.7317955
> resid(fit1, type='dfbeta')
[,1] [,2] [,3] [,4]
1 0.43370970 -1.087867e-02 0.126322520 0.048379059
2 0.14426449 -5.144770e-03 0.088768478 -0.033939677
3 0.25768057 -3.066698e-03 -0.066578834 0.021817646
4 0.05772598 -5.068044e-04 -0.013121427 -0.007762466
5 -0.58773456 6.676156e-03 0.084189274 0.008064026
6 0.01499533 -7.881949e-04 0.026570173 -0.013513160
7 -0.17869321 4.126121e-03 -0.072760519 -0.015006956
8 -0.11851540 2.520303e-03 -0.045549628 -0.035686269
9 0.08327656 3.206404e-03 -0.141835350 0.024490806
10 -0.25083921 5.321702e-03 -0.073986269 -0.020648720
11 -0.21333934 4.155746e-03 -0.049832434 -0.040215681
12 0.13889770 -1.586136e-03 -0.019701151 -0.004686340
13 0.07892133 -2.706713e-03 0.085242459 0.007847879
14 0.29690157 -1.987141e-03 -0.085553120 0.017447343
15 0.04344618 -6.319243e-04 -0.001944285 -0.003533279
16 0.04866809 -1.068317e-03 0.012398602 -0.006340983
17 0.04368104 -9.248316e-04 0.009428718 -0.004869178
18 0.15684611 -2.081485e-03 -0.013068320 -0.003265399
19 0.48839511 -4.775829e-03 -0.093258090 0.032703354
20 0.17598922 -2.349254e-03 -0.014202966 -0.002486428
21 0.37869758 -8.442011e-03 0.163476417 0.100850775
22 -0.59761427 8.803638e-03 0.052784598 -0.053085234
23 -0.79017984 1.092304e-02 0.053690092 0.080780399
24 -0.02348526 8.331002e-04 -0.039028433 -0.032765737
25 -0.13948485 3.687927e-04 0.056781884 -0.055647859
26 0.05778937 3.766350e-06 -0.029232389 -0.008927920
> resid(fit1, type='dfbetas')
[,1] [,2] [,3] [,4]
1 0.288846658 -0.4627232074 0.345395116 0.20574292
2 0.096078819 -0.2188323823 0.242713641 -0.14433617
3 0.171612884 -0.1304417700 -0.182041999 0.09278449
4 0.038444974 -0.0215568869 -0.035877029 -0.03301165
5 -0.391425795 0.2839697749 0.230193032 0.03429410
6 0.009986751 -0.0335258093 0.072649027 -0.05746778
7 -0.119008027 0.1755042532 -0.198944162 -0.06382048
8 -0.078930164 0.1072008799 -0.124543264 -0.15176395
9 0.055461420 0.1363841532 -0.387810796 0.10415271
10 -0.167056601 0.2263581990 -0.202295647 -0.08781336
11 -0.142082031 0.1767643342 -0.136253451 -0.17102630
12 0.092504589 -0.0674661531 -0.053867524 -0.01992972
13 0.052560878 -0.1151298322 0.233072686 0.03337488
14 0.197733705 -0.0845228882 -0.233922105 0.07419878
15 0.028934753 -0.0268788526 -0.005316126 -0.01502607
16 0.032412497 -0.0454407662 0.033900659 -0.02696647
17 0.029091172 -0.0393376416 0.025780305 -0.02070728
18 0.104458066 -0.0885357994 -0.035731824 -0.01388685
19 0.325266641 -0.2031395176 -0.254989284 0.13907843
20 0.117207199 -0.0999253459 -0.038834208 -0.01057410
21 0.252209096 -0.3590802699 0.446982501 0.42889079
22 -0.398005596 0.3744620571 0.144325354 -0.22575700
23 -0.526252483 0.4646108448 0.146801184 0.34353696
24 -0.015640965 0.0354358527 -0.106712804 -0.13934372
25 -0.092895624 0.0156865706 0.155254862 -0.23665514
26 0.038487186 0.0001602014 -0.079928144 -0.03796800
> resid(fit1, type='ldcase')
1 2 3 4 5 6
0.374432175 0.145690278 0.112678800 0.006399163 0.261176992 0.013280058
7 8 9 10 11 12
0.109842490 0.074103234 0.248285282 0.128482147 0.094038203 0.016111951
13 14 15 16 17 18
0.132812463 0.111857574 0.001698300 0.004730718 0.003131173 0.015840667
19 20 21 22 23 24
0.179925399 0.019071941 0.797119488 0.233096445 0.666613755 0.062959708
25 26
0.080117437 0.015922378
> resid(fit1, type='ldresp')
1 2 3 4 5 6
0.076910173 0.173810883 0.078356928 0.005310644 0.060742612 0.010002154
7 8 9 10 11 12
0.067356838 0.067065693 0.355103899 0.067043195 0.068142828 0.016740944
13 14 15 16 17 18
0.193444572 0.165021262 0.001494685 0.004083386 0.002767560 0.016400993
19 20 21 22 23 24
0.269571809 0.020129806 1.409736499 1.040266083 0.058637282 0.071819025
25 26
0.112702844 0.015105534
> resid(fit1, type='ldshape')
1 2 3 4 5 6
0.870628250 0.383362440 0.412503605 0.005534970 0.513991064 0.003310847
7 8 9 10 11 12
0.291860593 0.154910362 0.256160646 0.312329770 0.183191309 0.004184904
13 14 15 16 17 18
0.110215710 0.049299495 0.007678445 0.011633336 0.011588605 0.008641251
19 20 21 22 23 24
0.112967758 0.008271358 2.246729275 0.966929220 1.022043272 0.143857170
25 26
0.079754096 0.001606647
> resid(fit1, type='matrix')
g dg ddg ds dds dsg
1 -1.74950763 -1.46198129 -0.32429540 0.88466493 -2.42358635 1.8800360
2 -0.68266980 -0.82027857 -1.38799493 -0.66206188 -0.57351872 1.3921043
3 -1.32369884 -1.33411374 -0.53625126 0.31503768 -1.83606321 1.8626973
4 -0.14514412 0.24059386 -0.39881329 -0.28013223 -0.26053084 0.2237590
5 -1.96497889 -1.50383619 -0.25491587 1.15700933 -2.68145423 1.8694717
6 -0.22328436 0.37012071 -0.61351964 -0.33477229 -0.16715487 0.1848047
7 -1.11099124 -1.23201028 -0.70550005 0.01052036 -1.48515401 1.8106760
8 -0.77288913 -0.95018808 -1.17265428 -0.51190170 -0.79753045 1.5525642
9 -1.01586016 1.68391053 -2.79128447 0.01598527 -0.01623681 -1.7104080
10 -1.08316634 -1.21566480 -0.73259465 -0.03052447 -1.43539383 1.7998987
11 -0.77825093 -0.95675178 -1.16177415 -0.50314979 -0.81016011 1.5600720
12 -0.22098818 0.36631452 -0.60721042 -0.33361394 -0.17002503 0.1866908
13 -0.91481479 1.51641567 -2.51364157 -0.08144930 0.07419757 -1.3814037
14 -0.71453621 1.18442981 -1.96333502 -0.24017106 0.15944438 -0.7863174
15 -0.04387880 0.07273440 -0.12056602 -0.13717935 -0.29168773 0.1546569
16 -0.07667699 0.12710134 -0.21068577 -0.19691828 -0.30879813 0.1993144
17 -0.05372862 0.08906165 -0.14763041 -0.15709224 -0.30221555 0.1713377
18 -0.17576861 0.29135764 -0.48296037 -0.30558900 -0.22570402 0.2151929
19 -0.81251205 1.34683655 -2.23254376 -0.16869744 0.13367171 -1.0672002
20 -0.19041424 0.31563454 -0.52320225 -0.31581218 -0.20797917 0.2078622
21 -1.97162252 3.26820173 -5.41743790 1.33844939 -2.24706488 -5.4868428
22 -0.68222519 1.23245193 -4.79064290 -0.58668577 -0.95209805 -2.8390386
23 -3.49689798 -1.62675999 -0.05115487 2.90949868 -4.20494743 1.7496975
24 -0.74529506 -0.91462436 -1.23160543 -0.55723389 -0.73139169 1.5108398
25 -0.56095318 -0.53280415 -1.86451840 -0.87536233 -0.22666819 0.9689667
26 -0.26776235 0.44384834 -0.73573207 -0.35281852 -0.11207472 0.1409908
>
> aeq(resid(fit1, type='working'),resid(fit4, type='working'))
[1] TRUE
> #aeq(resid(fit1, type='response'), resid(fit4, type='response'))#should differ
> aeq(resid(fit1, type='deviance'), resid(fit4, type='deviance'))
[1] TRUE
> aeq(resid(fit1, type='dfbeta'), resid(fit4, type='dfbeta'))
[1] TRUE
> aeq(resid(fit1, type='dfbetas'), resid(fit4, type='dfbetas'))
[1] TRUE
> aeq(resid(fit1, type='ldcase'), resid(fit4, type='ldcase'))
[1] TRUE
> aeq(resid(fit1, type='ldresp'), resid(fit4, type='ldresp'))
[1] TRUE
> aeq(resid(fit1, type='ldshape'), resid(fit4, type='ldshape'))
[1] TRUE
> aeq(resid(fit1, type='matrix'), resid(fit4, type='matrix'))
[1] TRUE
> #
> # Some tests of the quantile residuals
> #
> # These should agree exactly with Ripley and Venables' book
> fit1 <- survreg(Surv(time, status) ~ temp, data=imotor)
> summary(fit1)
Call:
survreg(formula = Surv(time, status) ~ temp, data = imotor)
Value Std. Error z p
(Intercept) 16.31852 0.62296 26.2 < 2e-16
temp -0.04531 0.00319 -14.2 < 2e-16
Log(scale) -1.09564 0.21480 -5.1 3.4e-07
Scale= 0.334
Weibull distribution
Loglik(model)= -147.4 Loglik(intercept only)= -169.5
Chisq= 44.32 on 1 degrees of freedom, p= 2.8e-11
Number of Newton-Raphson Iterations: 7
n= 40
>
> #
> # The first prediction has the SE that I think is correct
> # The third is the se found in an early draft of Ripley; fit1 ignoring
> # the variation in scale estimate, except via it's impact on the
> # upper left corner of the inverse information matrix.
> # Numbers 1 and 3 differ little for this dataset
> #
> predict(fit1, data.frame(temp=130), type='uquantile', p=c(.5, .1), se=T)
$fit
[1] 10.306068 9.676248
$se.fit
[1] 0.2135247 0.2202088
>
> fit2 <- survreg(Surv(time, status) ~ temp, data=imotor, scale=fit1$scale)
> predict(fit2, data.frame(temp=130), type='uquantile', p=c(.5, .1), se=T)
$fit
[1] 10.306068 9.676248
$se.fit
1 1
0.2057964 0.2057964
>
> fit3 <- fit2
> fit3$var <- fit1$var[1:2,1:2]
> predict(fit3, data.frame(temp=130), type='uquantile', p=c(.5, .1), se=T)
$fit
[1] 10.306068 9.676248
$se.fit
1 1
0.2219959 0.2219959
>
> pp <- seq(.05, .7, length=40)
> xx <- predict(fit1, data.frame(temp=130), type='uquantile', se=T,
+ p=pp)
> #matplot(pp, cbind(xx$fit, xx$fit+2*xx$se, xx$fit - 2*xx$se), type='l')
>
>
> #
> # Now try out the various combinations of strata, #predicted, and
> # number of quantiles desired
> #
> fit1 <- survreg(Surv(time, status) ~ inst + strata(inst) + age + sex, lung)
> qq1 <- predict(fit1, type='quantile', p=.3, se=T)
> qq2 <- predict(fit1, type='quantile', p=c(.2, .3, .4), se=T)
> aeq <- function(x,y) all.equal(as.vector(x), as.vector(y))
> aeq(qq1$fit, qq2$fit[,2])
[1] TRUE
> aeq(qq1$se.fit, qq2$se.fit[,2])
[1] TRUE
>
> qq3 <- predict(fit1, type='quantile', p=c(.2, .3, .4), se=T,
+ newdata= lung[1:5,])
> aeq(qq3$fit, qq2$fit[1:5,])
[1] TRUE
>
> qq4 <- predict(fit1, type='quantile', p=c(.2, .3, .4), se=T, newdata=lung[7,])
> aeq(qq4$fit, qq2$fit[7,])
[1] TRUE
>
> qq5 <- predict(fit1, type='quantile', p=c(.2, .3, .4), se=T, newdata=lung)
> aeq(qq2$fit, qq5$fit)
[1] TRUE
> aeq(qq2$se.fit, qq5$se.fit)
[1] TRUE
>
> proc.time()
user system elapsed
0.796 0.044 0.845