R version 4.4.0 RC (2024-04-16 r86458 ucrt) -- "Puppy Cup"
Copyright (C) 2024 The R Foundation for Statistical Computing
Platform: x86_64-w64-mingw32/x64

R is free software and comes with ABSOLUTELY NO WARRANTY.
You are welcome to redistribute it under certain conditions.
Type 'license()' or 'licence()' for distribution details.

R is a collaborative project with many contributors.
Type 'contributors()' for more information and
'citation()' on how to cite R or R packages in publications.

Type 'demo()' for some demos, 'help()' for on-line help, or
'help.start()' for an HTML browser interface to help.
Type 'q()' to quit R.

> library(survival)
> aeq <- function(x, y, ...) all.equal(as.vector(x), as.vector(y), ...)
> 
> # Check that a multi-state model, correctly set up, gives the same
> # solution as a time-dependent covariate.
> # This is a stronger test than mstrata: there the covariate which was mapped
> #  into a state was constant, here it is time-dependent.
> #
> # First build the TD data set from pbcseq, with a categorical bilirubin
> pbc1 <- pbcseq
> pbc1$bili4 <- cut(pbc1$bili, c(0,1, 2,4, 100), 
+                   c("normal", "1-2x", "2-4x", ">4"))
> ptemp <- subset(pbc1, !duplicated(id))  # first row of each
> 
> pbc2 <- tmerge(ptemp[, c("id", "age", "sex")], ptemp, id,
+                death= event(futime, status==2))
> 
> pbc2 <- tmerge(pbc2, pbc1, id=id, bili = tdc(day, bili),
+                  bili4 = tdc(day, bili4), bstat = event(day, as.numeric(bili4)))
> btemp <- with(pbc2, ifelse(death, 5, bstat))
> 
> # a row with the same starting and ending bili4 level is not an event
> b2 <- ifelse(((as.numeric(pbc2$bili4)) == btemp), 0, btemp)
> pbc2$bstat <- factor(b2, 0:5,
+                      c("censor", "normal", "1-2x", "2-4x", ">4", "death"))
> check1 <- survcheck(Surv(tstart, tstop, bstat) ~ 1, istate= bili4,
+                     id = id, data=pbc2)
> check1$transitions
        to
from     normal 1-2x 2-4x  >4 death (censored)
  normal      0   81   10   3     9         77
  1-2x       61    0   68  15     9         36
  2-4x        2   33    0  94    12         24
  >4          1    3   28   0   110         35
  death       0    0    0   0     0          0
> all.equal(as.character(pbc2$bili4), as.character(check1$istate))
[1] TRUE
> # the above verifies that I created the data set correctly
> 
> # Standard coxph fit with a time dependent bili4 variable.
> fit1 <- coxph(Surv(tstart, tstop, death) ~ age + bili4, pbc2)
> 
> # An additive multi-state fit, where bili4 is a state
> #  The three forms below should all give identical models
> fit2 <- coxph(list(Surv(tstart, tstop, bstat) ~ 1,
+                    c(1:4):5 ~ age / common + shared), id= id, istate=bili4,
+               data=pbc2)
> fit2b <- coxph(list(Surv(tstart, tstop, bstat) ~ 1,
+                    1:5 + 2:5 + 3:5 + 4:5 ~ age / common + shared), 
+               id= id, istate=bili4, data=pbc2)
> fit2c <- coxph(list(Surv(tstart, tstop, bstat) ~ 1,
+                    0:5 ~ age / common + shared), 
+               id= id, istate=bili4, data=pbc2)
> 
> # Make sure the names are correct and the coefficients match
> aeq(coef(fit1), coef(fit2))
[1] TRUE
> aeq(names(coef(fit2)), c("age", "ph(2:5/1:5)", "ph(3:5/1:5)", "ph(4:5/1:5)"))
[1] TRUE
> all.equal(coef(fit2), coef(fit2b))
[1] TRUE
> all.equal(coef(fit2), coef(fit2c))
[1] TRUE
> 
> # Now a model with a separate age effect for each bilirubin group
> fit3  <- coxph(Surv(tstart, tstop, death) ~ age*bili4, pbc2)
> fit3b <- coxph(Surv(tstart, tstop, death) ~ bili4/age, pbc2)
> fit4 <-  coxph(list(Surv(tstart, tstop, bstat) ~ 1,
+                    c(1:4):5 ~ age / shared), id= id, istate=bili4,
+               data=pbc2)
> all.equal(fit3$loglik, fit3b$loglik)
[1] TRUE
> all.equal(fit3$loglik, fit4$loglik)
[1] TRUE
> 
> # The coefficients are quite different due to different codings for dummy vars
> # Unpack the interaction, first 4 coefs will be the age effect within each
> #  bilirubin group
> temp <- c(coef(fit3)[1] + c(0, coef(fit3)[5:7]), coef(fit3)[2:4])
> names(temp)[1:4] <- c("age1", "age2", "age3", "age4")
> aeq(temp, coef(fit3b)[c(4:7, 1:3)])
[1] TRUE
> aeq(temp, coef(fit4))
[1] TRUE
> 
> # Third, a model with separate baseline hazards for each bili group
> fit5 <- coxph(Surv(tstart, tstop, death) ~ strata(bili4)/age, pbc2,
+               cluster=id)
> fit6 <- coxph(list(Surv(tstart, tstop, bstat) ~ 1, 0:5 ~ age),
+                    id=id, istate=bili4, pbc2)
> aeq(coef(fit5), coef(fit6))
[1] TRUE
> aeq(fit5$var, fit6$var)
[1] TRUE
> aeq(fit5$naive.var, fit6$naive.var)
[1] TRUE
> 
> proc.time()
   user  system elapsed 
   1.23    0.12    1.29