CircosHeatmap-aardio/dist/lib/r/site-library/survival/tests/book5.R

library(survival)
# Session-wide settings for the rest of this script: use na.exclude as the
# missing-value action and fix the factor contrasts to treatment/polynomial.
options(na.action=na.exclude) # preserve missings
options(contrasts=c('contr.treatment', 'contr.poly')) # ensure contrast type

# Tests of the weighted Cox model
#  This is section 1.3 of my appendix -- not yet found in the book
#  though, it awaits the next edition
#
# Similar data set to test1, but add weights,
#                                    a double-death/censor tied time
#                                    a censored last subject
# The latter two are cases covered only feebly elsewhere.
# 
# The data set testw2 has the same data, but done via replication
#
# Equality helper for the checks in this script: both arguments are passed
# through as.vector() before being handed to all.equal(), so the result is
# either TRUE or all.equal's character description of the differences.
aeq <- function(x, y) {
    target  <- as.vector(x)
    current <- as.vector(y)
    all.equal(target, current)
}

# Weighted test data: nine subjects, each with a case weight (wt) and an id.
testw1 <- data.frame(
    time   = c(1,1,2,2,2,2,3,4,5),
    status = c(1,0,1,1,1,0,0,1,0),
    x      = c(2,0,1,1,0,1,0,1,0),
    wt     = c(1,2,3,4,3,2,1,2,1),
    id     = seq_len(9))
# Expanded data set: subject i is repeated wt[i] times and the wt column
# (the 4th) is dropped, so an unweighted fit can be run on it.
testw2 <- testw1[rep(seq_len(nrow(testw1)), times = testw1$wt),
                 setdiff(names(testw1), "wt")]
rownames(testw2) <- NULL
# Row of testw2 holding the first copy of each subject
indx <- match(testw1$id, testw2$id)

# Breslow estimate
# Closed-form Breslow quantities for the weighted nine-subject test data,
# evaluated at a given coefficient.  The data (x, status, wt) are hard-coded
# inside the function; deaths occur at times 1, 2 (three tied) and 4.
#
# Arguments:
#   beta  coefficient at which all quantities are evaluated
#   newx  covariate value used for the hazard variance (varhaz only)
#
# Returns a list:
#   loglik, U, imat   log partial likelihood, its first derivative, and the
#                     information (negative second derivative)
#   hazard, xbar      hazard increment and weighted mean of x, one value per
#                     distinct death time
#   mart, expected    status - expected, and the expected count per subject
#   score             per-subject score residuals
#   schoen            per-death Schoenfeld residuals (x of the death - xbar)
#   varhaz            variance of the cumulative hazard at x = newx
byhand <- function(beta, newx=0) {
    # The test data, one entry per subject
    x      <- c(2,0,1,1,0,1,0,1,0)
    status <- c(1,0,1,1,1,0,0,1,0)
    wt     <- c(1,2,3,4,3,2,1,2,1)
    dead   <- which(status == 1)   # subjects 1,3,4,5,8
    dtime  <- c(1,2,2,2,3)         # which distinct death time each death uses

    r <- exp(beta)
    loglik <- 11*beta - (log(r^2 + 11*r +7) + 10*log(11*r +5) +2*log(2*r+1))
    hazard <- c(1/(r^2 + 11*r +7), 10/(11*r +5), 2/(2*r+1))
    xbar <- c((2*r^2 + 11*r)*hazard[1], 11*r/(11*r +5), r*hazard[3])
    U <- 11- (xbar[1] + 10*xbar[2] + 2*xbar[3])
    imat <- (4*r^2 + 11*r)*hazard[1] - xbar[1]^2 +
            10*(xbar[2] - xbar[2]^2) + 2*(xbar[3] - xbar[3]^2)

    cumhaz <- cumsum(hazard)
    risk <- c(r^2, 1,r,r,1,r,1,r,1)     # exp(beta*x) for each subject
    # Each subject accumulates hazard up to the last death time at or
    # before its own time
    expected <- risk* cumhaz[c(1,1,2,2,2,2,2,3,3)]

    # At-risk indicators, one row per obs, one col per death
    #   deaths at 1,2,2,2, and 4
    riskmat <- matrix(c(1,1,1,1,1,1,1,1,1,
                        0,0,1,1,1,1,1,1,1,
                        0,0,1,1,1,1,1,1,1,
                        0,0,1,1,1,1,1,1,1,
                        0,0,0,0,0,0,0,1,1), ncol=5)
    # Same matrix scaled by each subject's weight * risk score; its column
    # sums are the denominators of the hazard increments
    wtmat <- diag(wt * risk) %*% riskmat

    # Table of sums for score and Schoenfeld resids
    hazmat <- riskmat %*% diag(wt[dead]/colSums(wtmat))
    dM <- -risk*hazmat  #Expected part
    # Add the observed part: a 1 in the cell for each subject's own death
    dcell <- cbind(dead, seq_along(dead))
    dM[dcell] <- dM[dcell] + 1
    score.mat <- dM * outer(x, xbar[dtime] ,'-')

    # Increments to the variance of the hazard; c(1,10,2) is the total
    # weight of the deaths at each distinct death time
    var.g <- cumsum(hazard^2/ c(1,10,2))
    var.d <- cumsum((xbar-newx)*hazard)

    list(loglik=loglik, U=U, imat=imat, hazard=hazard, xbar=xbar,
         mart=status-expected, expected=expected,
         score=rowSums(score.mat), schoen=x[dead] - xbar[dtime],
         varhaz=(var.g + var.d^2/imat)* exp(2*beta*newx))
}

# Check byhand against itself first: at beta=0 the expected counts must
# match these hand-computed fractions.
aeq(byhand(0)$expected, c(1/19, 1/19, rep(103/152, 5), rep(613/456,2))) #verify 

# Four Breslow fits of the same model:
#   fit0 / fit0b  stopped at iter=0 (compared below with byhand(0, ...)),
#                 on the weighted and the replicated data respectively
#   fit  / fitb   default iteration, weighted and replicated data
fit0 <- coxph(Surv(time, status) ~x, testw1, weights=wt,
		    method='breslow', iter=0)
fit0b <- coxph(Surv(time, status) ~x, testw2, method='breslow', iter=0)
fit  <- coxph(Surv(time, status) ~x, testw1, weights=wt, method='breslow')
fitb <- coxph(Surv(time, status) ~x, testw2, method='breslow')

# iter=0 fits: the weighted fit and the replicated-data fit should give the
# same residuals.  indx selects one row per subject from the replicated fit.
aeq(resid(fit0, type='mart'), (resid(fit0b, type='mart'))[indx])
aeq(resid(fit0, type='scor'), (resid(fit0b, type='scor'))[indx])
# Schoenfeld residuals are compared as distinct values only; the two fits
# presumably return a different number of rows (one per death) -- confirm.
aeq(unique(resid(fit0, type='scho')), unique(resid(fit0b, type='scho')))

# Compare the iter=0 weighted fit with the closed-form values at beta=0.
# newx=pi matters only for varhaz and matches the x=pi used in survfit below.
truth0 <- byhand(0,pi)
aeq(fit0$loglik[1], truth0$loglik)
aeq(1/truth0$imat, fit0$var)
aeq(truth0$mart, fit0$residuals)
aeq(truth0$schoen, resid(fit0, 'schoen'))
aeq(truth0$score, resid(fit0, 'score')) 
sfit <- survfit(fit0, list(x=pi), censor=FALSE)
aeq(sfit$std.err^2, truth0$varhaz)
# With beta=0 no rescaling for x is needed: -log(S) is the cumulative hazard
aeq(-log(sfit$surv), cumsum(truth0$hazard))

# Same comparisons for the iterated weighted fit.  0.85955744 is a hard-coded
# coefficient -- presumably the converged estimate of `fit`; re-derive it if
# the data or method ever change.
truth <- byhand(0.85955744, .3)
aeq(truth$loglik, fit$loglik[2])
aeq(1/truth$imat, fit$var)
aeq(truth$mart, fit$residuals)
aeq(truth$schoen, resid(fit, 'schoen'))
aeq(truth$score, resid(fit, 'score'))

# Predicted curve at x=.3, the same newx given to byhand above
sfit <- survfit(fit, list(x=.3), censor=FALSE)
aeq(sfit$std.err^2, truth$varhaz) 
# byhand's hazard is for x=0, so scale it by exp(coef * .3) before comparing
aeq(-log(sfit$surv), (cumsum(truth$hazard)* exp(fit$coefficients*.3)))


# Print the fits and their residuals (top-level expressions auto-print)
fit0
summary(fit)
resid(fit0, type='score')
resid(fit0, type='scho')

resid(fit, type='score')
resid(fit, type='scho')
# Iterated fits: weighted data vs. replicated data must give the same
# residuals; indx selects one row per subject from the replicated fit.
aeq(resid(fit, type='mart'), (resid(fitb, type='mart'))[indx])
aeq(resid(fit, type='scor'), (resid(fitb, type='scor'))[indx])
aeq(unique(resid(fit, type='scho')), unique(resid(fitb, type='scho')))
# Residuals requested with weighted=TRUE should be the plain residuals
# multiplied by the case weight, so their ratio must reproduce testw1$wt.
# TRUE is spelled out: T is an ordinary variable that can be reassigned.
rr1 <- resid(fit, type='mart')
rr2 <- resid(fit, type='mart', weighted=TRUE)
aeq(rr2/rr1, testw1$wt)

rr1 <- resid(fit, type='score')
rr2 <- resid(fit, type='score', weighted=TRUE)
aeq(rr2/rr1, testw1$wt)
首次上传 2025-01-12 00:52:51 +08:00			`library(survival)`
			`options(na.action=na.exclude) # preserve missings`
			`options(contrasts=c('contr.treatment', 'contr.poly')) #ensure contrast type`

			`# Tests of the weighted Cox model`
			`# This is section 1.3 of my appendix -- not yet found in the book`
			`# though, it awaits the next edition`
			`#`
			`# Similar data set to test1, but add weights,`
			`# a double-death/censor tied time`
			`# a censored last subject`
			`# The latter two are cases covered only feebly elsewhere.`
			`#`
			`# The data set testw2 has the same data, but done via replication`
			`#`
			`aeq <- function(x,y) all.equal(as.vector(x), as.vector(y))`

			`testw1 <- data.frame(time= c(1,1,2,2,2,2,3,4,5),`
			`status= c(1,0,1,1,1,0,0,1,0),`
			`x= c(2,0,1,1,0,1,0,1,0),`
			`wt = c(1,2,3,4,3,2,1,2,1),`
			`id = 1:9)`
			`# Expanded data set`
			`testw2 <- testw1[rep(1:9, testw1$wt), -4]`
			`row.names(testw2) <- NULL`
			`indx <- match(1:9, testw2$id)`

			`# Breslow estimate`
			`byhand <- function(beta, newx=0) {`
			`r <- exp(beta)`
			`loglik <- 11*beta - (log(r^2 + 11*r +7) + 10*log(11*r +5) +2*log(2*r+1))`
			`hazard <- c(1/(r^2 + 11*r +7), 10/(11*r +5), 2/(2*r+1))`
			`xbar <- c((2*r^2 + 11*r)*hazard[1], 11*r/(11*r +5), r*hazard[3])`
			`U <- 11- (xbar[1] + 10*xbar[2] + 2*xbar[3])`
			`imat <- (4*r^2 + 11*r)*hazard[1] - xbar[1]^2 +`
			`10*(xbar[2] - xbar[2]^2) + 2*(xbar[3] - xbar[3]^2)`

			`temp <- cumsum(hazard)`
			`risk <- c(r^2, 1,r,r,1,r,1,r,1)`
			`expected <- risk* temp[c(1,1,2,2,2,2,2,3,3)]`

			`# The matrix of weights, one row per obs, one col per death`
			`# deaths at 1,2,2,2, and 4`
			`riskmat <- matrix(c(1,1,1,1,1,1,1,1,1,`
			`0,0,1,1,1,1,1,1,1,`
			`0,0,1,1,1,1,1,1,1,`
			`0,0,1,1,1,1,1,1,1,`
			`0,0,0,0,0,0,0,1,1), ncol=5)`
			`wtmat <- diag(c(r^2, 2, 3*r, 4*r, 3, 2*r, 1, 2*r, 1)) %*% riskmat`

			`x <- c(2,0,1,1,0,1,0,1,0)`
			`status <- c(1,0,1,1,1,0,0,1,0)`
			`wt <- c(1,2,3,4,3,2,1,2,1)`
			`# Table of sums for score and Schoenfeld resids`
			`hazmat <- riskmat %*% diag(c(1,3,4,3,2)/colSums(wtmat))`
			`dM <- -risk*hazmat #Expected part`
			`dM[1,1] <- dM[1,1] +1 # deaths at time 1`
			`for (i in 2:4) dM[i+1, i] <- dM[i+1,i] +1`
			`dM[8,5] <- dM[8,5] +1`
			`mart <- rowSums(dM)`
			`resid <-dM * outer(x, xbar[c(1,2,2,2,3)] ,'-')`

			`# Increments to the variance of the hazard`
			`var.g <- cumsum(hazard^2/ c(1,10,2))`
			`var.d <- cumsum((xbar-newx)*hazard)`

			`list(loglik=loglik, U=U, imat=imat, hazard=hazard, xbar=xbar,`
			`mart=c(1,0,1,1,1,0,0,1,0)-expected, expected=expected,`
			`score=rowSums(resid), schoen=c(2,1,1,0,1) - xbar[c(1,2,2,2,3)],`
			`varhaz=(var.g + var.d^2/imat)* exp(2*beta*newx))`
			`}`

			`aeq(byhand(0)$expected, c(1/19, 1/19, rep(103/152, 5), rep(613/456,2))) #verify`

			`fit0 <- coxph(Surv(time, status) ~x, testw1, weights=wt,`
			`method='breslow', iter=0)`
			`fit0b <- coxph(Surv(time, status) ~x, testw2, method='breslow', iter=0)`
			`fit <- coxph(Surv(time, status) ~x, testw1, weights=wt, method='breslow')`
			`fitb <- coxph(Surv(time, status) ~x, testw2, method='breslow')`

			`aeq(resid(fit0, type='mart'), (resid(fit0b, type='mart'))[indx])`
			`aeq(resid(fit0, type='scor'), (resid(fit0b, type='scor'))[indx])`
			`aeq(unique(resid(fit0, type='scho')), unique(resid(fit0b, type='scho')))`

			`truth0 <- byhand(0,pi)`
			`aeq(fit0$loglik[1], truth0$loglik)`
			`aeq(1/truth0$imat, fit0$var)`
			`aeq(truth0$mart, fit0$residuals)`
			`aeq(truth0$schoen, resid(fit0, 'schoen'))`
			`aeq(truth0$score, resid(fit0, 'score'))`
			`sfit <- survfit(fit0, list(x=pi), censor=FALSE)`
			`aeq(sfit$std.err^2, truth0$varhaz)`
			`aeq(-log(sfit$surv), cumsum(truth0$hazard))`

			`truth <- byhand(0.85955744, .3)`
			`aeq(truth$loglik, fit$loglik[2])`
			`aeq(1/truth$imat, fit$var)`
			`aeq(truth$mart, fit$residuals)`
			`aeq(truth$schoen, resid(fit, 'schoen'))`
			`aeq(truth$score, resid(fit, 'score'))`

			`sfit <- survfit(fit, list(x=.3), censor=FALSE)`
			`aeq(sfit$std.err^2, truth$varhaz)`
			`aeq(-log(sfit$surv), (cumsum(truth$hazard)* exp(fit$coefficients*.3)))`


			`fit0`
			`summary(fit)`
			`resid(fit0, type='score')`
			`resid(fit0, type='scho')`

			`resid(fit, type='score')`
			`resid(fit, type='scho')`
			`aeq(resid(fit, type='mart'), (resid(fitb, type='mart'))[indx])`
			`aeq(resid(fit, type='scor'), (resid(fitb, type='scor'))[indx])`
			`aeq(unique(resid(fit, type='scho')), unique(resid(fitb, type='scho')))`
			`rr1 <- resid(fit, type='mart')`
			`rr2 <- resid(fit, type='mart', weighted=T)`
			`aeq(rr2/rr1, testw1$wt)`

			`rr1 <- resid(fit, type='score')`
			`rr2 <- resid(fit, type='score', weighted=T)`
			`aeq(rr2/rr1, testw1$wt)`