Installation from CRAN:
install.packages("gfoRmulaICE")
Installation from GitHub repo:
devtools::install_github("CausalInference/gfoRmulaICE")
Please see the following for a few examples.
In this example, we illustrate how to specify dynamic intervention. We consider the following interventions, which are applied to all time points.
- Intervention 1 on A2: at time t, if L1 = 0, then treat; otherwise, not treat.
- Intervention 2 on A2: never treat upon until L1 = 0, after which follows always treat.
- Intervention 3 on A2: never treat upon until L1 = 0, after which follows natural course.
We use classical pooled ICE estimator and natural course as the reference intervention. We estimate variance using bootstrap with 1000 replicates, normal quantile, and parallel computing.
library(gfoRmulaICE)
ice_fit1 <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = F),
nsamples = 1000, ci_method = "percentile",
parallel = T, ncores = 5,
int_descript = c("Dynamic Intervention 1", "Dynamic Intervention 2", "Dynamic Intervention 3"),
intervention1.A2 = list(dynamic("L1 == 0", static(0), static(1))),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1), absorb = T)),
intervention3.A2 = list(dynamic("L1 == 0", static(0), natural_course()))
)
summary(ice_fit1)
plot(ice_fit1)
In this example, we illustrate the available intervention functions within the package. We consider the following interventions and apply to all time points.
- Intervention 1 on A1: always treat with value 3.
- Intervention 1 on A2: always treat with value 1.
- Intervention 2 on L2: when the natural value of L2 at time t is lower than -3, set its value to -3. Otherwise, do not intervene.
- Intervention 3 on A2: dynamic intervention (treat when L1 = 0) with uniform grace period of 2 periods.
We use classical pooled ICE estimator and natural course as the reference intervention. We estimate variance using bootstrap with 1000 replicates, normal quantile, and parallel computing.
ice_fit2 <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention", "Threshold Intervention", "Dynamic Intervention with Grace Period"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.L2 = list(threshold(-3, Inf)),
intervention3.A2 = list(grace_period("uniform", 2, "L1 == 0"))
)
summary(ice_fit2)
plot(ice_fit2)
In this example, we illustrate how to specify user-defined intervention. We consider the following interventions and apply to all time points.
- Intervention 1 on A1: at time t, if L2 < 0, then assign 1; if 0 <= L2 < 2, then assign 2; otherwise, assign 3.
We use classical pooled ICE estimator and natural course as the reference intervention. We estimate variance using bootstrap with 1000 replicates and percentile quantile.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit3 <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
competing_model = D ~ L1 + L2 + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Dynamic Intervention"),
intervention1.A1 = list(dynamic_cat)
)
summary(ice_fit3)
plot(ice_fit3)
In this example, we illustrate all available ICE estimators in the package. We consider the following interventions and apply to all time points.
- Intervention 1 on A1: always treat with value 3.
- Intervention 1 on A2: always treat with value 1.
- Intervention 2 on A1: at time t, if L2 < 0, then assign 1; if 0 <= L2 < 2, then assign 2; otherwise, assign 3.
- Intervention 2 on A2: at time t, if L1 = 0, then treat; otherwise, not treat.
We use natural course as the reference intervention and estimate variance using bootstrap with 1000 replicates and percentile quantile.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit4a <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
competing_model = D ~ L1 + L2 + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: classical pooled ICE",
"Dynamic Intervention: classical pooled ICE"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4a)
plot(ice_fit4a)
In case where the hazard model is the same as the outcome model, there is no need to specify hazard_model argument.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit4b <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
competing_model = D ~ L1 + L2 + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = T),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: hazard-based pooled ICE",
"Dynamic Intervention: hazard-based pooled ICE"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4b)
plot(ice_fit4b)
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit4c <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2,
censor_model = C ~ L1 + L2,
ref_idx = 0,
estimator = strat(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: classical stratified ICE",
"Dynamic Intervention: classical stratified ICE"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4c)
plot(ice_fit4c)
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit4d <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2,
censor_model = C ~ L1 + L2,
competing_model = D ~ L1 + L2,
hazard_model = Y ~ L1,
ref_idx = 0,
estimator = strat(hazard = T),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: hazard-based stratified ICE",
"Dynamic Intervention: hazard-based stratified ICE"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4d)
plot(ice_fit4d)
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit4e <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2,
censor_model = C ~ L1 + L2,
ref_idx = 0,
estimator = weight(list(A1 ~ L1 + L2, A2 ~ L1 + L2)),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: doubly robust ICE",
"Dynamic Intervention: doubly robust ICE"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4e)
plot(ice_fit4e)
In this example, we illustrate available options for specifying hazard model in hazard-based ICE estimators. We consider the same interventions in Example 4.
We allow pooled-over-time hazard model with flexible terms of time variable and time-specific hazard model in hazard-based pooled ICE. Note, in hazard-based stratified ICE, only time-specific hazard model is allowed.
To specify pooled-over-time hazard model in hazard-based pooled ICE, we set the global_hazard argument to r{TRUE}
. To specify time-specific hazard model in hazard-based pooled ICE, we set the global_hazard argument to r{FALSE}
, which is the default value. Example 4b illustrates the time-specific hazard model. We illustrate the pooled-over-time option in this example.
library(splines)
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit5 <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ L1 + L2 + A1 + A2,
censor_model = C ~ L1 + L2 + A1 + A2,
competing_model = D ~ L1 + L2 + A1 + A2,
hazard_model = Y ~ L1 + L2 + A1 + A2 + ns(t0, df = 2),
global_hazard = T,
ref_idx = 0,
estimator = pool(hazard = T),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: pooled-over-time",
"Dynamic Intervention: pooled-over-time"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit4b, ice_fit5)
plot(ice_fit4b, ice_fit5)
We allow users to specify intervention-specific models in stratified ICE and doubly robust ICE. We consider the same analysis in Example 4d but with intervention-specific models.
In this example, the outcome model for intervention 1 is Y ~ L1; The outcome model for intervention 2: Y ~ L1 + L2; The competing model for intervention 1: D ~ L1 + L2; The competing model for intervention 2: D ~ L1.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit6 <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
outcome_model = Y ~ L1,
censor_model = C ~ L1,
competing_model = D ~ L1,
comp_effect = 1,
ref_idx = 0,
estimator = strat(hazard = T),
nsamples = 1000,
ci_method = "normal",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention: intervention-specific model",
"Dynamic Intervention: intervention-specific model"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1))),
outcomeModel.1 = Y ~ L1 + L2,
compModel.2 = D ~ L1 + L2
)
summary(ice_fit4d, ice_fit6)
plot(ice_fit4d, ice_fit6)
In this example, we illustrate that including polynomial, spline, and lagged terms in model statements is supported. We consider the same interventions as in Example 4. We illustrate using the pooled ICE estimator.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit7a <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id", time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ I(L1^2) + rcspline.eval(lag1_L2, knots = 1:3) + A1 + A2,
censor_model = C ~ lag1_L1 + poly(L2, degree = 2) + A1 + A2,
ref_idx = 0,
estimator = pool(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention", "Dynamic Intervention"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit7a)
plot(ice_fit7a)
In this example, we use static intervention as the reference intervention. We consider the same interventions as in Example 4. We illustrate using the pooled ICE estimator.
dynamic_cat <- case_when(gfoRmulaICE::compData$L2 < 0 ~ 1,
gfoRmulaICE::compData$L2 >= 0 & gfoRmulaICE::compData$L2 < 2 ~ 2,
T ~ 3)
ice_fit7b <- ice(data = gfoRmulaICE::compData,
time_points = 4,
id = "id",
time_name = "t0",
censor_name = "C",
outcome_name = "Y",
compevent_name = "D",
comp_effect = 0,
outcome_model = Y ~ I(L1^2) + rcspline.eval(lag1_L2, knots = 1:3) + A1 + A2,
censor_model = C ~ lag1_L1 + poly(L2, degree = 2) + A1 + A2,
ref_idx = 1,
estimator = pool(hazard = F),
nsamples = 1000,
ci_method = "percentile",
parallel = T,
ncores = 5,
int_descript = c("Static Intervention", "Dynamic Intervention"),
intervention1.A1 = list(static(3)),
intervention1.A2 = list(static(1)),
intervention2.A1 = list(dynamic_cat),
intervention2.A2 = list(dynamic("L1 == 0", static(0), static(1)))
)
summary(ice_fit7b)
plot(ice_fit7b)