243 lines
8.3 KiB
Plaintext
Raw Normal View History

2025-01-12 00:52:51 +08:00
R Under development (unstable) (2021-04-20 r80202) -- "Unsuffered Consequences"
Copyright (C) 2021 The R Foundation for Statistical Computing
Platform: x86_64-pc-linux-gnu (64-bit)
R is free software and comes with ABSOLUTELY NO WARRANTY.
You are welcome to redistribute it under certain conditions.
Type 'license()' or 'licence()' for distribution details.
R is a collaborative project with many contributors.
Type 'contributors()' for more information and
'citation()' on how to cite R or R packages in publications.
Type 'demo()' for some demos, 'help()' for on-line help, or
'help.start()' for an HTML browser interface to help.
Type 'q()' to quit R.
> library(survival)
> aeq <- function(x, y, ...) all.equal(as.vector(x), as.vector(y), ...)
>
> # Check that estimates from a multi-state model agree with single state models
> # Use a simplified version of the myeloid data set
> tdata <- tmerge(myeloid[,1:3], myeloid, id=id, death=event(futime,death),
+ priortx = tdc(txtime), sct= event(txtime))
> tdata$event <- factor(with(tdata, sct + 2*death), 0:2,
+ c("censor", "sct", "death"))
> fit <- coxph(Surv(tstart, tstop, event) ~ trt + sex, tdata, id=id,
+ iter=4, x=TRUE, robust=FALSE)
>
> fit12 <- coxph(Surv(tstart, tstop, event=='sct') ~ trt + sex, tdata,
+ subset=(priortx==0), iter=4, x=TRUE)
> fit13 <- coxph(Surv(tstart, tstop, event=='death') ~ trt + sex, tdata,
+ subset=(priortx==0), iter=4, x=TRUE)
> fit23 <- coxph(Surv(tstart, tstop, event=='death') ~ trt + sex, tdata,
+ subset=(priortx==1), iter=4, x=TRUE)
> aeq(coef(fit), c(coef(fit12), coef(fit13), coef(fit23)))
[1] TRUE
> aeq(fit$loglik, fit12$loglik + fit13$loglik + fit23$loglik)
[1] TRUE
> temp <- matrix(0, 6,6)
> temp[1:2, 1:2] <- fit12$var
> temp[3:4, 3:4] <- fit13$var
> temp[5:6, 5:6] <- fit23$var
> aeq(fit$var, temp)
[1] TRUE
>
> # check out model.frame
> fita <- coxph(Surv(tstart, tstop, event) ~ trt, tdata, id=id)
> fitb <- coxph(Surv(tstart, tstop, event) ~ trt, tdata, id=id, model=TRUE)
> all.equal(model.frame(fita), fitb$model)
[1] "Component \"trt\": 'current' is not a factor"
> # model.frame fails due to an interal rule in R, factors vs characters
> # result when the xlev arg is in the call. So model.frame(fita) has trt
> # as a factor, not character.
>
> #check residuals
> indx1 <- which(fit$rmap[,2] ==1)
> indx2 <- which(fit$rmap[,2] ==2)
> indx3 <- which(fit$rmap[,2] ==3)
> aeq(residuals(fit), c(residuals(fit12), residuals(fit13), residuals(fit23)))
[1] TRUE
> aeq(residuals(fit)[indx1], residuals(fit12))
[1] TRUE
> aeq(residuals(fit)[indx2], residuals(fit13))
[1] TRUE
> aeq(residuals(fit)[indx3], residuals(fit23))
[1] TRUE
>
> # score residuals
> temp <- residuals(fit, type='score')
> aeq(temp[indx1, 1:2], residuals(fit12, type='score'))
[1] TRUE
> aeq(temp[indx2, 3:4], residuals(fit13, type='score'))
[1] TRUE
> aeq(temp[indx3, 5:6], residuals(fit23, type='score'))
[1] TRUE
>
> all(temp[indx1, 3:6] ==0)
[1] TRUE
> all(temp[indx2, c(1,2,5,6)] ==0)
[1] TRUE
> all(temp[indx3, 1:4]==0)
[1] TRUE
>
> temp <- residuals(fit, type="dfbeta")
> all(temp[indx1, 3:6] ==0)
[1] TRUE
> all(temp[indx2, c(1,2,5,6)] ==0)
[1] TRUE
> all(temp[indx3, 1:4]==0)
[1] TRUE
> aeq(temp[indx1, 1:2], residuals(fit12, type='dfbeta'))
[1] TRUE
> aeq(temp[indx2, 3:4], residuals(fit13, type='dfbeta'))
[1] TRUE
> aeq(temp[indx3, 5:6], residuals(fit23, type='dfbeta'))
[1] TRUE
>
> temp <- residuals(fit, type="dfbetas")
> all(temp[indx1, 3:6] ==0)
[1] TRUE
> all(temp[indx2, c(1,2,5,6)] ==0)
[1] TRUE
> all(temp[indx3, 1:4]==0)
[1] TRUE
> aeq(temp[indx1, 1:2], residuals(fit12, type='dfbetas'))
[1] TRUE
> aeq(temp[indx2, 3:4], residuals(fit13, type='dfbetas'))
[1] TRUE
> aeq(temp[indx3, 5:6], residuals(fit23, type='dfbetas'))
[1] TRUE
>
> # Schoenfeld and scaled shoenfeld have one row per event
> sr1 <- residuals(fit12, type="schoenfeld")
> sr2 <- residuals(fit13, type="schoenfeld")
> sr3 <- residuals(fit23, type="schoenfeld")
> end <- rep(1:3, c(nrow(sr1), nrow(sr2), nrow(sr3)))
> temp <- residuals(fit, type="schoenfeld")
> aeq(temp[end==1, 1:2], sr1)
[1] TRUE
> aeq(temp[end==2, 3:4], sr2)
[1] TRUE
> aeq(temp[end==3, 5:6], sr3)
[1] TRUE
> all(temp[end==1, 3:6] ==0)
[1] TRUE
> all(temp[end==2, c(1,2,5,6)] ==0)
[1] TRUE
> all(temp[end==3, 1:4] ==0)
[1] TRUE
>
>
> #The scaled Schoenfeld don't agree, due to the use of a robust
> # variance in fit, regular variance in fit12, fit13 and fit23
> #Along with being scaled by different event counts
> xfit <- fit
> xfit$var <- xfit$naive.var
> if (FALSE) {
+ xfit <- fit
+ xfit$var <- xfit$naive.var # fixes the first issue
+ temp <- residuals(xfit, type="scaledsch")
+ aeq(d1* temp[sindx1, 1:2], residuals(fit12, type='scaledsch'))
+ aeq(temp[sindx2, 3:4], residuals(fit13, type='scaledsch'))
+ aeq(temp[sindx3, 5:6], residuals(fit23, type='scaledsch'))
+ }
>
> if (FALSE) { # the predicted values are a work in progress
+ # predicted values differ because of different centering
+ c0 <- sum(fit$mean * coef(fit))
+ c12 <- sum(fit12$mean * coef(fit12))
+ c13 <- sum(fit13$mean* coef(fit13))
+ c23 <- sum(fit23$mean * coef(fit23))
+
+ aeq(predict(fit)+c0, c(predict(fit12)+c12, predict(fit13)+c13,
+ predict(fit23)+c23))
+ aeq(exp(predict(fit)), predict(fit, type='risk'))
+
+ # expected survival is independent of centering
+ aeq(predict(fit, type="expected"), c(predict(fit12, type="expected"),
+ predict(fit13, type="expected"),
+ predict(fit23, type="expected")))
+ }
> # predict(type='terms') is a matrix, centering changes as well
> if (FALSE) {
+ temp <- predict(fit, type='terms')
+ all(temp[indx1, 3:6] ==0)
+ all(temp[indx2, c(1,2,5,6)] ==0)
+ all(temp[indx3, 1:4]==0)
+ aeq(temp[indx1, 1:2], predict(fit12, type='terms'))
+ aeq(temp[indx2, 3:4], predict(fit13, type='terms'))
+ aeq(temp[indx3, 5:6], predict(fit23, type='terms'))
+ } # end of prediction section
>
> # The global and per strata zph tests will differ for the KM or rank
> # transform, because the overall and subset will have a different list
> # of event times, which changes the transformed value for all of them.
> # But identity and log are testable.
> test_a <- cox.zph(fit, transform="log",global=FALSE)
> test_a12 <- cox.zph(fit12, transform="log",global=FALSE)
> test_a13 <- cox.zph(fit13, transform="log", global=FALSE)
> test_a23 <- cox.zph(fit23, transform="log", global=FALSE)
> aeq(test_a$y[test_a$strata==1, 1:2], test_a12$y)
[1] TRUE
>
> aeq(test_a$table[1:2,], test_a12$table)
[1] TRUE
> aeq(test_a$table[3:4,], test_a13$table)
[1] TRUE
> aeq(test_a$table[5:6,], test_a23$table)
[1] TRUE
>
> # check cox.zph fit - transform = 'identity'
> test_b <- cox.zph(fit, transform="identity",global=FALSE)
> test_b12 <- cox.zph(fit12, transform="identity",global=FALSE)
> test_b13 <- cox.zph(fit13, transform="identity", global=FALSE)
> test_b23 <- cox.zph(fit23, transform="identity", global=FALSE)
>
> aeq(test_b$table[1:2,], test_b12$table)
[1] TRUE
> aeq(test_b$table[3:4,], test_b13$table)
[1] TRUE
> aeq(test_b$table[5:6,], test_b23$table)
[1] TRUE
>
> # check out subscripting of a multi-state zph
> cname <- c("table", "x", "time", "y", "var")
> sapply(cname, function(x) aeq(test_b[1:2]$x, test_b12$x))
table x time y var
TRUE TRUE TRUE TRUE TRUE
> sapply(cname, function(x) aeq(test_b[3:4]$x, test_b13$x))
table x time y var
TRUE TRUE TRUE TRUE TRUE
> sapply(cname, function(x) aeq(test_b[5:6]$x, test_b23$x))
table x time y var
TRUE TRUE TRUE TRUE TRUE
>
> # check model.matrix
> mat1 <- model.matrix(fit)
> all.equal(mat1, fit$x)
[1] TRUE
>
> # Check that the internal matix agrees (uses stacker, which is not exported)
> mat2 <- model.matrix(fit12)
> mat3 <- model.matrix(fit13)
> mat4 <- model.matrix(fit23)
>
> # first reconstruct istate
> tcheck <- survcheck(Surv(tstart, tstop, event) ~ 1, tdata, id=id)
> temp <- survival:::stacker(fit$cmap, fit$smap, as.numeric(tcheck$istate), fit$x,
+ fit$y, NULL, fit$states)
> aeq(temp$X[temp$transition==1, 1:2], mat2)
[1] TRUE
> aeq(temp$X[temp$transition==2, 3:4], mat3)
[1] TRUE
> aeq(temp$X[temp$transition==3, 5:6], mat4)
[1] TRUE
>
>
>
> proc.time()
user system elapsed
1.314 0.113 1.428